Coverage for flair/flair/datasets/__init__.py: 100%
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
1# Expose base classes
2from .base import DataLoader
3from .base import SentenceDataset
4from .base import StringDataset
5from .base import MongoDataset
7# Expose all sequence labeling datasets
8from .sequence_labeling import ColumnCorpus
9from .sequence_labeling import ColumnDataset
10# standard NER datasets
11from .sequence_labeling import CONLL_03
12from .sequence_labeling import CONLL_03_GERMAN
13from .sequence_labeling import CONLL_03_DUTCH
14from .sequence_labeling import CONLL_03_SPANISH
15from .sequence_labeling import CONLL_2000
16from .sequence_labeling import BIOSCOPE
17from .sequence_labeling import WNUT_17
18# other NER datasets
19from .sequence_labeling import NER_ARABIC_ANER
20from .sequence_labeling import NER_ARABIC_AQMAR
21from .sequence_labeling import NER_BASQUE
22from .sequence_labeling import NER_CHINESE_WEIBO
23from .sequence_labeling import NER_DANISH_DANE
24from .sequence_labeling import NER_ENGLISH_MOVIE_SIMPLE
25from .sequence_labeling import NER_ENGLISH_MOVIE_COMPLEX
26from .sequence_labeling import NER_ENGLISH_PERSON
27from .sequence_labeling import NER_ENGLISH_RESTAURANT
28from .sequence_labeling import NER_ENGLISH_SEC_FILLINGS
29from .sequence_labeling import NER_ENGLISH_STACKOVERFLOW
30from .sequence_labeling import NER_ENGLISH_TWITTER
31from .sequence_labeling import NER_ENGLISH_WIKIGOLD
32from .sequence_labeling import NER_ENGLISH_WNUT_2020
33from .sequence_labeling import NER_ENGLISH_WEBPAGES
34from .sequence_labeling import NER_FINNISH
35from .sequence_labeling import NER_GERMAN_BIOFID
36from .sequence_labeling import NER_GERMAN_EUROPARL
37from .sequence_labeling import NER_GERMAN_GERMEVAL
38from .sequence_labeling import NER_GERMAN_LEGAL
39from .sequence_labeling import NER_GERMAN_POLITICS
40from .sequence_labeling import NER_HUNGARIAN
41from .sequence_labeling import NER_ICELANDIC
42from .sequence_labeling import NER_JAPANESE
43from .sequence_labeling import NER_MASAKHANE
44from .sequence_labeling import NER_MULTI_WIKINER
45from .sequence_labeling import NER_MULTI_WIKIANN
46from .sequence_labeling import NER_MULTI_XTREME
47from .sequence_labeling import NER_SWEDISH
48from .sequence_labeling import NER_TURKU
49# keyphrase detection datasets
50from .sequence_labeling import KEYPHRASE_INSPEC
51from .sequence_labeling import KEYPHRASE_SEMEVAL2010
52from .sequence_labeling import KEYPHRASE_SEMEVAL2017
53# universal proposition banks
54from .sequence_labeling import UP_CHINESE
55from .sequence_labeling import UP_ENGLISH
56from .sequence_labeling import UP_FINNISH
57from .sequence_labeling import UP_FRENCH
58from .sequence_labeling import UP_GERMAN
59from .sequence_labeling import UP_ITALIAN
60from .sequence_labeling import UP_SPANISH
61from .sequence_labeling import UP_SPANISH_ANCORA
63# Expose all entity linking datasets
64from .entity_linking import EntityLinkingCorpus
65from .entity_linking import NEL_ENGLISH_AIDA
66from .entity_linking import NEL_ENGLISH_AQUAINT
67from .entity_linking import NEL_ENGLISH_IITB
68from .entity_linking import NEL_ENGLISH_REDDIT
69from .entity_linking import NEL_ENGLISH_TWEEKI
70from .entity_linking import NEL_GERMAN_HIPE
72# word sense disambiguation
73from .entity_linking import WSD_UFSAC
74from .entity_linking import WSD_RAGANATO_ALL
75from .entity_linking import WSD_SEMCOR
76from .entity_linking import WSD_WORDNET_GLOSS_TAGGED
77from .entity_linking import WSD_MASC
78from .entity_linking import WSD_OMSTI
79from .entity_linking import WSD_TRAINOMATIC
81# Expose all document classification datasets
82from .document_classification import ClassificationCorpus
83from .document_classification import ClassificationDataset
84from .document_classification import CSVClassificationCorpus
85from .document_classification import CSVClassificationDataset
86from .document_classification import AMAZON_REVIEWS
87from .document_classification import COMMUNICATIVE_FUNCTIONS
88from .document_classification import GERMEVAL_2018_OFFENSIVE_LANGUAGE
89from .document_classification import GLUE_COLA
90from .document_classification import GO_EMOTIONS
91from .document_classification import IMDB
92from .document_classification import NEWSGROUPS
93from .document_classification import SENTIMENT_140
94from .document_classification import SENTEVAL_CR
95from .document_classification import SENTEVAL_MR
96from .document_classification import SENTEVAL_MPQA
97from .document_classification import SENTEVAL_SUBJ
98from .document_classification import SENTEVAL_SST_BINARY
99from .document_classification import SENTEVAL_SST_GRANULAR
100from .document_classification import TREC_50
101from .document_classification import TREC_6
102from .document_classification import WASSA_ANGER
103from .document_classification import WASSA_FEAR
104from .document_classification import WASSA_JOY
105from .document_classification import WASSA_SADNESS
106from .document_classification import YAHOO_ANSWERS
108# Expose all treebanks
109from .treebanks import UniversalDependenciesCorpus
110from .treebanks import UniversalDependenciesDataset
111from .treebanks import UD_ARMENIAN
112from .treebanks import UD_ENGLISH
113from .treebanks import UD_ANCIENT_GREEK
114from .treebanks import UD_KAZAKH
115from .treebanks import UD_ESTONIAN
116from .treebanks import UD_GERMAN
117from .treebanks import UD_GERMAN_HDT
118from .treebanks import UD_DUTCH
119from .treebanks import UD_FAROESE
120from .treebanks import UD_FRENCH
121from .treebanks import UD_ITALIAN
122from .treebanks import UD_SPANISH
123from .treebanks import UD_PORTUGUESE
124from .treebanks import UD_ROMANIAN
125from .treebanks import UD_CATALAN
126from .treebanks import UD_POLISH
127from .treebanks import UD_CZECH
128from .treebanks import UD_SLOVAK
129from .treebanks import UD_SWEDISH
130from .treebanks import UD_DANISH
131from .treebanks import UD_NORWEGIAN
132from .treebanks import UD_FINNISH
133from .treebanks import UD_SLOVENIAN
134from .treebanks import UD_CROATIAN
135from .treebanks import UD_SERBIAN
136from .treebanks import UD_BULGARIAN
137from .treebanks import UD_ARABIC
138from .treebanks import UD_HEBREW
139from .treebanks import UD_TURKISH
140from .treebanks import UD_PERSIAN
141from .treebanks import UD_RUSSIAN
142from .treebanks import UD_HINDI
143from .treebanks import UD_INDONESIAN
144from .treebanks import UD_JAPANESE
145from .treebanks import UD_CHINESE
146from .treebanks import UD_KOREAN
147from .treebanks import UD_BASQUE
148from .treebanks import UD_GREEK
149from .treebanks import UD_LIVVI
150from .treebanks import UD_NORTH_SAMI
151from .treebanks import UD_MARATHI
152from .treebanks import UD_MALTESE
153from .treebanks import UD_AFRIKAANS
154from .treebanks import UD_OLD_FRENCH
155from .treebanks import UD_GOTHIC
156from .treebanks import UD_WOLOF
157from .treebanks import UD_BELARUSIAN
158from .treebanks import UD_OLD_CHURCH_SLAVONIC
159from .treebanks import UD_COPTIC
160from .treebanks import UD_IRISH
161from .treebanks import UD_LATVIAN
162from .treebanks import UD_LITHUANIAN
163from .treebanks import UD_GALICIAN
164from .treebanks import UD_LATIN
166# Expose all text-text datasets
167from .text_text import ParallelTextCorpus
168from .text_text import ParallelTextDataset
169from .text_text import OpusParallelCorpus
170from .text_text import DataPairDataset
171from .text_text import DataPairCorpus
172from .text_text import GLUE_MNLI
173from .text_text import GLUE_MRPC
174from .text_text import GLUE_RTE
175from .text_text import GLUE_QNLI
176from .text_text import GLUE_QQP
177from .text_text import GLUE_WNLI
178from .text_text import SUPERGLUE_RTE
180# Expose all text-image datasets
181from .text_image import FeideggerCorpus
182from .text_image import FeideggerDataset
184# Expose all biomedical data sets
185from .biomedical import ANAT_EM
186from .biomedical import AZDZ
187from .biomedical import BIONLP2013_PC
188from .biomedical import BIONLP2013_CG
189from .biomedical import BIO_INFER
190from .biomedical import BIOSEMANTICS
191from .biomedical import BC2GM
192from .biomedical import CELL_FINDER
193from .biomedical import CEMP
194from .biomedical import CDR
195from .biomedical import CHEMDNER
196from .biomedical import CRAFT
197from .biomedical import CRAFT_V4
198from .biomedical import CLL
199from .biomedical import DECA
200from .biomedical import FSU
201from .biomedical import GELLUS
202from .biomedical import GPRO
203from .biomedical import IEPA
204from .biomedical import JNLPBA
205from .biomedical import LOCTEXT
206from .biomedical import LINNEAUS
207from .biomedical import NCBI_DISEASE
208from .biomedical import MIRNA
209from .biomedical import OSIRIS
210from .biomedical import PDR
211from .biomedical import S800
212from .biomedical import SCAI_CHEMICALS
213from .biomedical import SCAI_DISEASE
214from .biomedical import VARIOME
216# Expose all biomedical data sets using the HUNER splits
217from .biomedical import HUNER_CHEMICAL
218from .biomedical import HUNER_CHEMICAL_CHEBI
219from .biomedical import HUNER_CHEMICAL_CHEMDNER
220from .biomedical import HUNER_CHEMICAL_CDR
221from .biomedical import HUNER_CHEMICAL_CEMP
222from .biomedical import HUNER_CHEMICAL_SCAI
223from .biomedical import HUNER_CHEMICAL_CRAFT_V4
224# -
225from .biomedical import HUNER_CELL_LINE
226from .biomedical import HUNER_CELL_LINE_CLL
227from .biomedical import HUNER_CELL_LINE_CELL_FINDER
228from .biomedical import HUNER_CELL_LINE_GELLUS
229from .biomedical import HUNER_CELL_LINE_JNLPBA
230# -
231from .biomedical import HUNER_DISEASE
232from .biomedical import HUNER_DISEASE_CDR
233from .biomedical import HUNER_DISEASE_MIRNA
234from .biomedical import HUNER_DISEASE_NCBI
235from .biomedical import HUNER_DISEASE_SCAI
236from .biomedical import HUNER_DISEASE_VARIOME
237from .biomedical import HUNER_DISEASE_PDR
238# -
239from .biomedical import HUNER_GENE
240from .biomedical import HUNER_GENE_BIO_INFER
241from .biomedical import HUNER_GENE_BC2GM
242from .biomedical import HUNER_GENE_CHEBI
243from .biomedical import HUNER_GENE_CRAFT_V4
244from .biomedical import HUNER_GENE_CELL_FINDER
245from .biomedical import HUNER_GENE_DECA
246from .biomedical import HUNER_GENE_FSU
247from .biomedical import HUNER_GENE_GPRO
248from .biomedical import HUNER_GENE_IEPA
249from .biomedical import HUNER_GENE_JNLPBA
250from .biomedical import HUNER_GENE_LOCTEXT
251from .biomedical import HUNER_GENE_MIRNA
252from .biomedical import HUNER_GENE_OSIRIS
253from .biomedical import HUNER_GENE_VARIOME
254# -
255from .biomedical import HUNER_SPECIES
256from .biomedical import HUNER_SPECIES_CELL_FINDER
257from .biomedical import HUNER_SPECIES_CHEBI
258from .biomedical import HUNER_SPECIES_CRAFT_V4
259from .biomedical import HUNER_SPECIES_LOCTEXT
260from .biomedical import HUNER_SPECIES_LINNEAUS
261from .biomedical import HUNER_SPECIES_MIRNA
262from .biomedical import HUNER_SPECIES_S800
263from .biomedical import HUNER_SPECIES_VARIOME
265# Expose all biomedical data sets used for the evaluation of BioBERT
266from .biomedical import BIOBERT_CHEMICAL_BC4CHEMD
267from .biomedical import BIOBERT_CHEMICAL_BC5CDR
268from .biomedical import BIOBERT_DISEASE_NCBI
269from .biomedical import BIOBERT_DISEASE_BC5CDR
270from .biomedical import BIOBERT_SPECIES_LINNAEUS
271from .biomedical import BIOBERT_SPECIES_S800
272from .biomedical import BIOBERT_GENE_BC2GM
273from .biomedical import BIOBERT_GENE_JNLPBA
275# Expose all relation extraction datasets
276from .relation_extraction import RE_ENGLISH_SEMEVAL2010
277from .relation_extraction import RE_ENGLISH_TACRED
278from .relation_extraction import RE_ENGLISH_CONLL04
279from .relation_extraction import RE_ENGLISH_DRUGPROT