Coverage for flair/flair/datasets/__init__.py: 100%

Shortcuts on this page

r m x   toggle line displays

j k   next/prev highlighted chunk

0   (zero) top of page

1   (one) first highlighted chunk

249 statements  

1# Expose base classes 

2from .base import DataLoader 

3from .base import SentenceDataset 

4from .base import StringDataset 

5from .base import MongoDataset 

6 

7# Expose all sequence labeling datasets 

8from .sequence_labeling import ColumnCorpus 

9from .sequence_labeling import ColumnDataset 

10# standard NER datasets 

11from .sequence_labeling import CONLL_03 

12from .sequence_labeling import CONLL_03_GERMAN 

13from .sequence_labeling import CONLL_03_DUTCH 

14from .sequence_labeling import CONLL_03_SPANISH 

15from .sequence_labeling import CONLL_2000 

16from .sequence_labeling import BIOSCOPE 

17from .sequence_labeling import WNUT_17 

18# other NER datasets 

19from .sequence_labeling import NER_ARABIC_ANER 

20from .sequence_labeling import NER_ARABIC_AQMAR 

21from .sequence_labeling import NER_BASQUE 

22from .sequence_labeling import NER_CHINESE_WEIBO 

23from .sequence_labeling import NER_DANISH_DANE 

24from .sequence_labeling import NER_ENGLISH_MOVIE_SIMPLE 

25from .sequence_labeling import NER_ENGLISH_MOVIE_COMPLEX 

26from .sequence_labeling import NER_ENGLISH_PERSON 

27from .sequence_labeling import NER_ENGLISH_RESTAURANT 

28from .sequence_labeling import NER_ENGLISH_SEC_FILLINGS 

29from .sequence_labeling import NER_ENGLISH_STACKOVERFLOW 

30from .sequence_labeling import NER_ENGLISH_TWITTER 

31from .sequence_labeling import NER_ENGLISH_WIKIGOLD 

32from .sequence_labeling import NER_ENGLISH_WNUT_2020 

33from .sequence_labeling import NER_ENGLISH_WEBPAGES 

34from .sequence_labeling import NER_FINNISH 

35from .sequence_labeling import NER_GERMAN_BIOFID 

36from .sequence_labeling import NER_GERMAN_EUROPARL 

37from .sequence_labeling import NER_GERMAN_GERMEVAL 

38from .sequence_labeling import NER_GERMAN_LEGAL 

39from .sequence_labeling import NER_GERMAN_POLITICS 

40from .sequence_labeling import NER_HUNGARIAN 

41from .sequence_labeling import NER_ICELANDIC 

42from .sequence_labeling import NER_JAPANESE 

43from .sequence_labeling import NER_MASAKHANE 

44from .sequence_labeling import NER_MULTI_WIKINER 

45from .sequence_labeling import NER_MULTI_WIKIANN 

46from .sequence_labeling import NER_MULTI_XTREME 

47from .sequence_labeling import NER_SWEDISH 

48from .sequence_labeling import NER_TURKU 

49from .sequence_labeling import MultiCoNer 

50# keyphrase detection datasets 

51from .sequence_labeling import KEYPHRASE_INSPEC 

52from .sequence_labeling import KEYPHRASE_SEMEVAL2010 

53from .sequence_labeling import KEYPHRASE_SEMEVAL2017 

54# universal proposition banks 

55from .sequence_labeling import UP_CHINESE 

56from .sequence_labeling import UP_ENGLISH 

57from .sequence_labeling import UP_FINNISH 

58from .sequence_labeling import UP_FRENCH 

59from .sequence_labeling import UP_GERMAN 

60from .sequence_labeling import UP_ITALIAN 

61from .sequence_labeling import UP_SPANISH 

62from .sequence_labeling import UP_SPANISH_ANCORA 

63 

64# Expose all entity linking datasets 

65from .entity_linking import EntityLinkingCorpus 

66from .entity_linking import NEL_ENGLISH_AIDA 

67from .entity_linking import NEL_ENGLISH_AQUAINT 

68from .entity_linking import NEL_ENGLISH_IITB 

69from .entity_linking import NEL_ENGLISH_REDDIT 

70from .entity_linking import NEL_ENGLISH_TWEEKI 

71from .entity_linking import NEL_GERMAN_HIPE 

72 

73# word sense disambiguation 

74from .entity_linking import WSD_UFSAC 

75from .entity_linking import WSD_RAGANATO_ALL 

76from .entity_linking import WSD_SEMCOR 

77from .entity_linking import WSD_WORDNET_GLOSS_TAGGED 

78from .entity_linking import WSD_MASC 

79from .entity_linking import WSD_OMSTI 

80from .entity_linking import WSD_TRAINOMATIC 

81 

82# Expose all document classification datasets 

83from .document_classification import ClassificationCorpus 

84from .document_classification import ClassificationDataset 

85from .document_classification import CSVClassificationCorpus 

86from .document_classification import CSVClassificationDataset 

87from .document_classification import AMAZON_REVIEWS 

88from .document_classification import COMMUNICATIVE_FUNCTIONS 

89from .document_classification import GERMEVAL_2018_OFFENSIVE_LANGUAGE 

90from .document_classification import GLUE_COLA 

91from .document_classification import GO_EMOTIONS 

92from .document_classification import IMDB 

93from .document_classification import NEWSGROUPS 

94from .document_classification import SENTIMENT_140 

95from .document_classification import SENTEVAL_CR 

96from .document_classification import SENTEVAL_MR 

97from .document_classification import SENTEVAL_MPQA 

98from .document_classification import SENTEVAL_SUBJ 

99from .document_classification import SENTEVAL_SST_BINARY 

100from .document_classification import SENTEVAL_SST_GRANULAR 

101from .document_classification import TREC_50 

102from .document_classification import TREC_6 

103from .document_classification import WASSA_ANGER 

104from .document_classification import WASSA_FEAR 

105from .document_classification import WASSA_JOY 

106from .document_classification import WASSA_SADNESS 

107from .document_classification import YAHOO_ANSWERS 

108 

109# Expose all treebanks 

110from .treebanks import UniversalDependenciesCorpus 

111from .treebanks import UniversalDependenciesDataset 

112from .treebanks import UD_ARMENIAN 

113from .treebanks import UD_ENGLISH 

114from .treebanks import UD_ANCIENT_GREEK 

115from .treebanks import UD_KAZAKH 

116from .treebanks import UD_ESTONIAN 

117from .treebanks import UD_GERMAN 

118from .treebanks import UD_GERMAN_HDT 

119from .treebanks import UD_DUTCH 

120from .treebanks import UD_FAROESE 

121from .treebanks import UD_FRENCH 

122from .treebanks import UD_ITALIAN 

123from .treebanks import UD_SPANISH 

124from .treebanks import UD_PORTUGUESE 

125from .treebanks import UD_ROMANIAN 

126from .treebanks import UD_CATALAN 

127from .treebanks import UD_POLISH 

128from .treebanks import UD_CZECH 

129from .treebanks import UD_SLOVAK 

130from .treebanks import UD_SWEDISH 

131from .treebanks import UD_DANISH 

132from .treebanks import UD_NORWEGIAN 

133from .treebanks import UD_FINNISH 

134from .treebanks import UD_SLOVENIAN 

135from .treebanks import UD_CROATIAN 

136from .treebanks import UD_SERBIAN 

137from .treebanks import UD_BULGARIAN 

138from .treebanks import UD_ARABIC 

139from .treebanks import UD_HEBREW 

140from .treebanks import UD_TURKISH 

141from .treebanks import UD_PERSIAN 

142from .treebanks import UD_RUSSIAN 

143from .treebanks import UD_HINDI 

144from .treebanks import UD_INDONESIAN 

145from .treebanks import UD_JAPANESE 

146from .treebanks import UD_CHINESE 

147from .treebanks import UD_KOREAN 

148from .treebanks import UD_BASQUE 

149from .treebanks import UD_GREEK 

150from .treebanks import UD_LIVVI 

151from .treebanks import UD_NORTH_SAMI 

152from .treebanks import UD_MARATHI 

153from .treebanks import UD_MALTESE 

154from .treebanks import UD_AFRIKAANS 

155from .treebanks import UD_OLD_FRENCH 

156from .treebanks import UD_GOTHIC 

157from .treebanks import UD_WOLOF 

158from .treebanks import UD_BELARUSIAN 

159from .treebanks import UD_OLD_CHURCH_SLAVONIC 

160from .treebanks import UD_COPTIC 

161from .treebanks import UD_IRISH 

162from .treebanks import UD_LATVIAN 

163from .treebanks import UD_LITHUANIAN 

164from .treebanks import UD_GALICIAN 

165from .treebanks import UD_LATIN 

166 

167# Expose all text-text datasets 

168from .text_text import ParallelTextCorpus 

169from .text_text import ParallelTextDataset 

170from .text_text import OpusParallelCorpus 

171from .text_text import DataPairDataset 

172from .text_text import DataPairCorpus 

173from .text_text import GLUE_MNLI 

174from .text_text import GLUE_MRPC 

175from .text_text import GLUE_RTE 

176from .text_text import GLUE_QNLI 

177from .text_text import GLUE_QQP 

178from .text_text import GLUE_WNLI 

179from .text_text import SUPERGLUE_RTE 

180 

181# Expose all text-image datasets 

182from .text_image import FeideggerCorpus 

183from .text_image import FeideggerDataset 

184 

185# Expose all biomedical data sets 

186from .biomedical import ANAT_EM 

187from .biomedical import AZDZ 

188from .biomedical import BIONLP2013_PC 

189from .biomedical import BIONLP2013_CG 

190from .biomedical import BIO_INFER 

191from .biomedical import BIOSEMANTICS 

192from .biomedical import BC2GM 

193from .biomedical import CELL_FINDER 

194from .biomedical import CEMP 

195from .biomedical import CDR 

196from .biomedical import CHEMDNER 

197from .biomedical import CRAFT 

198from .biomedical import CRAFT_V4 

199from .biomedical import CLL 

200from .biomedical import DECA 

201from .biomedical import FSU 

202from .biomedical import GELLUS 

203from .biomedical import GPRO 

204from .biomedical import IEPA 

205from .biomedical import JNLPBA 

206from .biomedical import LOCTEXT 

207from .biomedical import LINNEAUS 

208from .biomedical import NCBI_DISEASE 

209from .biomedical import MIRNA 

210from .biomedical import OSIRIS 

211from .biomedical import PDR 

212from .biomedical import S800 

213from .biomedical import SCAI_CHEMICALS 

214from .biomedical import SCAI_DISEASE 

215from .biomedical import VARIOME 

216 

217# Expose all biomedical data sets using the HUNER splits 

218from .biomedical import HUNER_CHEMICAL 

219from .biomedical import HUNER_CHEMICAL_CHEBI 

220from .biomedical import HUNER_CHEMICAL_CHEMDNER 

221from .biomedical import HUNER_CHEMICAL_CDR 

222from .biomedical import HUNER_CHEMICAL_CEMP 

223from .biomedical import HUNER_CHEMICAL_SCAI 

224from .biomedical import HUNER_CHEMICAL_CRAFT_V4 

225# - 

226from .biomedical import HUNER_CELL_LINE 

227from .biomedical import HUNER_CELL_LINE_CLL 

228from .biomedical import HUNER_CELL_LINE_CELL_FINDER 

229from .biomedical import HUNER_CELL_LINE_GELLUS 

230from .biomedical import HUNER_CELL_LINE_JNLPBA 

231# - 

232from .biomedical import HUNER_DISEASE 

233from .biomedical import HUNER_DISEASE_CDR 

234from .biomedical import HUNER_DISEASE_MIRNA 

235from .biomedical import HUNER_DISEASE_NCBI 

236from .biomedical import HUNER_DISEASE_SCAI 

237from .biomedical import HUNER_DISEASE_VARIOME 

238from .biomedical import HUNER_DISEASE_PDR 

239# - 

240from .biomedical import HUNER_GENE 

241from .biomedical import HUNER_GENE_BIO_INFER 

242from .biomedical import HUNER_GENE_BC2GM 

243from .biomedical import HUNER_GENE_CHEBI 

244from .biomedical import HUNER_GENE_CRAFT_V4 

245from .biomedical import HUNER_GENE_CELL_FINDER 

246from .biomedical import HUNER_GENE_DECA 

247from .biomedical import HUNER_GENE_FSU 

248from .biomedical import HUNER_GENE_GPRO 

249from .biomedical import HUNER_GENE_IEPA 

250from .biomedical import HUNER_GENE_JNLPBA 

251from .biomedical import HUNER_GENE_LOCTEXT 

252from .biomedical import HUNER_GENE_MIRNA 

253from .biomedical import HUNER_GENE_OSIRIS 

254from .biomedical import HUNER_GENE_VARIOME 

255# - 

256from .biomedical import HUNER_SPECIES 

257from .biomedical import HUNER_SPECIES_CELL_FINDER 

258from .biomedical import HUNER_SPECIES_CHEBI 

259from .biomedical import HUNER_SPECIES_CRAFT_V4 

260from .biomedical import HUNER_SPECIES_LOCTEXT 

261from .biomedical import HUNER_SPECIES_LINNEAUS 

262from .biomedical import HUNER_SPECIES_MIRNA 

263from .biomedical import HUNER_SPECIES_S800 

264from .biomedical import HUNER_SPECIES_VARIOME 

265 

266# Expose all biomedical data sets used for the evaluation of BioBERT 

267from .biomedical import BIOBERT_CHEMICAL_BC4CHEMD 

268from .biomedical import BIOBERT_CHEMICAL_BC5CDR 

269from .biomedical import BIOBERT_DISEASE_NCBI 

270from .biomedical import BIOBERT_DISEASE_BC5CDR 

271from .biomedical import BIOBERT_SPECIES_LINNAEUS 

272from .biomedical import BIOBERT_SPECIES_S800 

273from .biomedical import BIOBERT_GENE_BC2GM 

274from .biomedical import BIOBERT_GENE_JNLPBA 

275 

276# Expose all relation extraction datasets 

277from .relation_extraction import RE_ENGLISH_SEMEVAL2010 

278from .relation_extraction import RE_ENGLISH_TACRED 

279from .relation_extraction import RE_ENGLISH_CONLL04 

280from .relation_extraction import RE_ENGLISH_DRUGPROT