Coverage for flair/flair/datasets/__init__.py: 100%

Shortcuts on this page

r m x   toggle line displays

j k   next/prev highlighted chunk

0   (zero) top of page

1   (one) first highlighted chunk

248 statements  

1# Expose base classes 

2from .base import DataLoader 

3from .base import SentenceDataset 

4from .base import StringDataset 

5from .base import MongoDataset 

6 

7# Expose all sequence labeling datasets 

8from .sequence_labeling import ColumnCorpus 

9from .sequence_labeling import ColumnDataset 

10# standard NER datasets 

11from .sequence_labeling import CONLL_03 

12from .sequence_labeling import CONLL_03_GERMAN 

13from .sequence_labeling import CONLL_03_DUTCH 

14from .sequence_labeling import CONLL_03_SPANISH 

15from .sequence_labeling import CONLL_2000 

16from .sequence_labeling import BIOSCOPE 

17from .sequence_labeling import WNUT_17 

18# other NER datasets 

19from .sequence_labeling import NER_ARABIC_ANER 

20from .sequence_labeling import NER_ARABIC_AQMAR 

21from .sequence_labeling import NER_BASQUE 

22from .sequence_labeling import NER_CHINESE_WEIBO 

23from .sequence_labeling import NER_DANISH_DANE 

24from .sequence_labeling import NER_ENGLISH_MOVIE_SIMPLE 

25from .sequence_labeling import NER_ENGLISH_MOVIE_COMPLEX 

26from .sequence_labeling import NER_ENGLISH_PERSON 

27from .sequence_labeling import NER_ENGLISH_RESTAURANT 

28from .sequence_labeling import NER_ENGLISH_SEC_FILLINGS 

29from .sequence_labeling import NER_ENGLISH_STACKOVERFLOW 

30from .sequence_labeling import NER_ENGLISH_TWITTER 

31from .sequence_labeling import NER_ENGLISH_WIKIGOLD 

32from .sequence_labeling import NER_ENGLISH_WNUT_2020 

33from .sequence_labeling import NER_ENGLISH_WEBPAGES 

34from .sequence_labeling import NER_FINNISH 

35from .sequence_labeling import NER_GERMAN_BIOFID 

36from .sequence_labeling import NER_GERMAN_EUROPARL 

37from .sequence_labeling import NER_GERMAN_GERMEVAL 

38from .sequence_labeling import NER_GERMAN_LEGAL 

39from .sequence_labeling import NER_GERMAN_POLITICS 

40from .sequence_labeling import NER_HUNGARIAN 

41from .sequence_labeling import NER_ICELANDIC 

42from .sequence_labeling import NER_JAPANESE 

43from .sequence_labeling import NER_MASAKHANE 

44from .sequence_labeling import NER_MULTI_WIKINER 

45from .sequence_labeling import NER_MULTI_WIKIANN 

46from .sequence_labeling import NER_MULTI_XTREME 

47from .sequence_labeling import NER_SWEDISH 

48from .sequence_labeling import NER_TURKU 

49# keyphrase detection datasets 

50from .sequence_labeling import KEYPHRASE_INSPEC 

51from .sequence_labeling import KEYPHRASE_SEMEVAL2010 

52from .sequence_labeling import KEYPHRASE_SEMEVAL2017 

53# universal proposition banks 

54from .sequence_labeling import UP_CHINESE 

55from .sequence_labeling import UP_ENGLISH 

56from .sequence_labeling import UP_FINNISH 

57from .sequence_labeling import UP_FRENCH 

58from .sequence_labeling import UP_GERMAN 

59from .sequence_labeling import UP_ITALIAN 

60from .sequence_labeling import UP_SPANISH 

61from .sequence_labeling import UP_SPANISH_ANCORA 

62 

63# Expose all entity linking datasets 

64from .entity_linking import EntityLinkingCorpus 

65from .entity_linking import NEL_ENGLISH_AIDA 

66from .entity_linking import NEL_ENGLISH_AQUAINT 

67from .entity_linking import NEL_ENGLISH_IITB 

68from .entity_linking import NEL_ENGLISH_REDDIT 

69from .entity_linking import NEL_ENGLISH_TWEEKI 

70from .entity_linking import NEL_GERMAN_HIPE 

71 

72# word sense disambiguation 

73from .entity_linking import WSD_UFSAC 

74from .entity_linking import WSD_RAGANATO_ALL 

75from .entity_linking import WSD_SEMCOR 

76from .entity_linking import WSD_WORDNET_GLOSS_TAGGED 

77from .entity_linking import WSD_MASC 

78from .entity_linking import WSD_OMSTI 

79from .entity_linking import WSD_TRAINOMATIC 

80 

81# Expose all document classification datasets 

82from .document_classification import ClassificationCorpus 

83from .document_classification import ClassificationDataset 

84from .document_classification import CSVClassificationCorpus 

85from .document_classification import CSVClassificationDataset 

86from .document_classification import AMAZON_REVIEWS 

87from .document_classification import COMMUNICATIVE_FUNCTIONS 

88from .document_classification import GERMEVAL_2018_OFFENSIVE_LANGUAGE 

89from .document_classification import GLUE_COLA 

90from .document_classification import GO_EMOTIONS 

91from .document_classification import IMDB 

92from .document_classification import NEWSGROUPS 

93from .document_classification import SENTIMENT_140 

94from .document_classification import SENTEVAL_CR 

95from .document_classification import SENTEVAL_MR 

96from .document_classification import SENTEVAL_MPQA 

97from .document_classification import SENTEVAL_SUBJ 

98from .document_classification import SENTEVAL_SST_BINARY 

99from .document_classification import SENTEVAL_SST_GRANULAR 

100from .document_classification import TREC_50 

101from .document_classification import TREC_6 

102from .document_classification import WASSA_ANGER 

103from .document_classification import WASSA_FEAR 

104from .document_classification import WASSA_JOY 

105from .document_classification import WASSA_SADNESS 

106from .document_classification import YAHOO_ANSWERS 

107 

108# Expose all treebanks 

109from .treebanks import UniversalDependenciesCorpus 

110from .treebanks import UniversalDependenciesDataset 

111from .treebanks import UD_ARMENIAN 

112from .treebanks import UD_ENGLISH 

113from .treebanks import UD_ANCIENT_GREEK 

114from .treebanks import UD_KAZAKH 

115from .treebanks import UD_ESTONIAN 

116from .treebanks import UD_GERMAN 

117from .treebanks import UD_GERMAN_HDT 

118from .treebanks import UD_DUTCH 

119from .treebanks import UD_FAROESE 

120from .treebanks import UD_FRENCH 

121from .treebanks import UD_ITALIAN 

122from .treebanks import UD_SPANISH 

123from .treebanks import UD_PORTUGUESE 

124from .treebanks import UD_ROMANIAN 

125from .treebanks import UD_CATALAN 

126from .treebanks import UD_POLISH 

127from .treebanks import UD_CZECH 

128from .treebanks import UD_SLOVAK 

129from .treebanks import UD_SWEDISH 

130from .treebanks import UD_DANISH 

131from .treebanks import UD_NORWEGIAN 

132from .treebanks import UD_FINNISH 

133from .treebanks import UD_SLOVENIAN 

134from .treebanks import UD_CROATIAN 

135from .treebanks import UD_SERBIAN 

136from .treebanks import UD_BULGARIAN 

137from .treebanks import UD_ARABIC 

138from .treebanks import UD_HEBREW 

139from .treebanks import UD_TURKISH 

140from .treebanks import UD_PERSIAN 

141from .treebanks import UD_RUSSIAN 

142from .treebanks import UD_HINDI 

143from .treebanks import UD_INDONESIAN 

144from .treebanks import UD_JAPANESE 

145from .treebanks import UD_CHINESE 

146from .treebanks import UD_KOREAN 

147from .treebanks import UD_BASQUE 

148from .treebanks import UD_GREEK 

149from .treebanks import UD_LIVVI 

150from .treebanks import UD_NORTH_SAMI 

151from .treebanks import UD_MARATHI 

152from .treebanks import UD_MALTESE 

153from .treebanks import UD_AFRIKAANS 

154from .treebanks import UD_OLD_FRENCH 

155from .treebanks import UD_GOTHIC 

156from .treebanks import UD_WOLOF 

157from .treebanks import UD_BELARUSIAN 

158from .treebanks import UD_OLD_CHURCH_SLAVONIC 

159from .treebanks import UD_COPTIC 

160from .treebanks import UD_IRISH 

161from .treebanks import UD_LATVIAN 

162from .treebanks import UD_LITHUANIAN 

163from .treebanks import UD_GALICIAN 

164from .treebanks import UD_LATIN 

165 

166# Expose all text-text datasets 

167from .text_text import ParallelTextCorpus 

168from .text_text import ParallelTextDataset 

169from .text_text import OpusParallelCorpus 

170from .text_text import DataPairDataset 

171from .text_text import DataPairCorpus 

172from .text_text import GLUE_MNLI 

173from .text_text import GLUE_MRPC 

174from .text_text import GLUE_RTE 

175from .text_text import GLUE_QNLI 

176from .text_text import GLUE_QQP 

177from .text_text import GLUE_WNLI 

178from .text_text import SUPERGLUE_RTE 

179 

180# Expose all text-image datasets 

181from .text_image import FeideggerCorpus 

182from .text_image import FeideggerDataset 

183 

184# Expose all biomedical data sets 

185from .biomedical import ANAT_EM 

186from .biomedical import AZDZ 

187from .biomedical import BIONLP2013_PC 

188from .biomedical import BIONLP2013_CG 

189from .biomedical import BIO_INFER 

190from .biomedical import BIOSEMANTICS 

191from .biomedical import BC2GM 

192from .biomedical import CELL_FINDER 

193from .biomedical import CEMP 

194from .biomedical import CDR 

195from .biomedical import CHEMDNER 

196from .biomedical import CRAFT 

197from .biomedical import CRAFT_V4 

198from .biomedical import CLL 

199from .biomedical import DECA 

200from .biomedical import FSU 

201from .biomedical import GELLUS 

202from .biomedical import GPRO 

203from .biomedical import IEPA 

204from .biomedical import JNLPBA 

205from .biomedical import LOCTEXT 

206from .biomedical import LINNEAUS 

207from .biomedical import NCBI_DISEASE 

208from .biomedical import MIRNA 

209from .biomedical import OSIRIS 

210from .biomedical import PDR 

211from .biomedical import S800 

212from .biomedical import SCAI_CHEMICALS 

213from .biomedical import SCAI_DISEASE 

214from .biomedical import VARIOME 

215 

216# Expose all biomedical data sets using the HUNER splits 

217from .biomedical import HUNER_CHEMICAL 

218from .biomedical import HUNER_CHEMICAL_CHEBI 

219from .biomedical import HUNER_CHEMICAL_CHEMDNER 

220from .biomedical import HUNER_CHEMICAL_CDR 

221from .biomedical import HUNER_CHEMICAL_CEMP 

222from .biomedical import HUNER_CHEMICAL_SCAI 

223from .biomedical import HUNER_CHEMICAL_CRAFT_V4 

224# - 

225from .biomedical import HUNER_CELL_LINE 

226from .biomedical import HUNER_CELL_LINE_CLL 

227from .biomedical import HUNER_CELL_LINE_CELL_FINDER 

228from .biomedical import HUNER_CELL_LINE_GELLUS 

229from .biomedical import HUNER_CELL_LINE_JNLPBA 

230# - 

231from .biomedical import HUNER_DISEASE 

232from .biomedical import HUNER_DISEASE_CDR 

233from .biomedical import HUNER_DISEASE_MIRNA 

234from .biomedical import HUNER_DISEASE_NCBI 

235from .biomedical import HUNER_DISEASE_SCAI 

236from .biomedical import HUNER_DISEASE_VARIOME 

237from .biomedical import HUNER_DISEASE_PDR 

238# - 

239from .biomedical import HUNER_GENE 

240from .biomedical import HUNER_GENE_BIO_INFER 

241from .biomedical import HUNER_GENE_BC2GM 

242from .biomedical import HUNER_GENE_CHEBI 

243from .biomedical import HUNER_GENE_CRAFT_V4 

244from .biomedical import HUNER_GENE_CELL_FINDER 

245from .biomedical import HUNER_GENE_DECA 

246from .biomedical import HUNER_GENE_FSU 

247from .biomedical import HUNER_GENE_GPRO 

248from .biomedical import HUNER_GENE_IEPA 

249from .biomedical import HUNER_GENE_JNLPBA 

250from .biomedical import HUNER_GENE_LOCTEXT 

251from .biomedical import HUNER_GENE_MIRNA 

252from .biomedical import HUNER_GENE_OSIRIS 

253from .biomedical import HUNER_GENE_VARIOME 

254# - 

255from .biomedical import HUNER_SPECIES 

256from .biomedical import HUNER_SPECIES_CELL_FINDER 

257from .biomedical import HUNER_SPECIES_CHEBI 

258from .biomedical import HUNER_SPECIES_CRAFT_V4 

259from .biomedical import HUNER_SPECIES_LOCTEXT 

260from .biomedical import HUNER_SPECIES_LINNEAUS 

261from .biomedical import HUNER_SPECIES_MIRNA 

262from .biomedical import HUNER_SPECIES_S800 

263from .biomedical import HUNER_SPECIES_VARIOME 

264 

265# Expose all biomedical data sets used for the evaluation of BioBERT 

266from .biomedical import BIOBERT_CHEMICAL_BC4CHEMD 

267from .biomedical import BIOBERT_CHEMICAL_BC5CDR 

268from .biomedical import BIOBERT_DISEASE_NCBI 

269from .biomedical import BIOBERT_DISEASE_BC5CDR 

270from .biomedical import BIOBERT_SPECIES_LINNAEUS 

271from .biomedical import BIOBERT_SPECIES_S800 

272from .biomedical import BIOBERT_GENE_BC2GM 

273from .biomedical import BIOBERT_GENE_JNLPBA 

274 

275# Expose all relation extraction datasets 

276from .relation_extraction import RE_ENGLISH_SEMEVAL2010 

277from .relation_extraction import RE_ENGLISH_TACRED 

278from .relation_extraction import RE_ENGLISH_CONLL04 

279from .relation_extraction import RE_ENGLISH_DRUGPROT