Coverage for flair/flair/datasets/__init__.py: 100%
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
Shortcuts on this page
r m x toggle line displays
j k next/prev highlighted chunk
0 (zero) top of page
1 (one) first highlighted chunk
1# Expose base classes
2from .base import DataLoader
3from .base import SentenceDataset
4from .base import StringDataset
5from .base import MongoDataset
7# Expose all sequence labeling datasets
8from .sequence_labeling import ColumnCorpus
9from .sequence_labeling import ColumnDataset
10# standard NER datasets
11from .sequence_labeling import CONLL_03
12from .sequence_labeling import CONLL_03_GERMAN
13from .sequence_labeling import CONLL_03_DUTCH
14from .sequence_labeling import CONLL_03_SPANISH
15from .sequence_labeling import CONLL_2000
16from .sequence_labeling import BIOSCOPE
17from .sequence_labeling import WNUT_17
18# other NER datasets
19from .sequence_labeling import NER_ARABIC_ANER
20from .sequence_labeling import NER_ARABIC_AQMAR
21from .sequence_labeling import NER_BASQUE
22from .sequence_labeling import NER_CHINESE_WEIBO
23from .sequence_labeling import NER_DANISH_DANE
24from .sequence_labeling import NER_ENGLISH_MOVIE_SIMPLE
25from .sequence_labeling import NER_ENGLISH_MOVIE_COMPLEX
26from .sequence_labeling import NER_ENGLISH_PERSON
27from .sequence_labeling import NER_ENGLISH_RESTAURANT
28from .sequence_labeling import NER_ENGLISH_SEC_FILLINGS
29from .sequence_labeling import NER_ENGLISH_STACKOVERFLOW
30from .sequence_labeling import NER_ENGLISH_TWITTER
31from .sequence_labeling import NER_ENGLISH_WIKIGOLD
32from .sequence_labeling import NER_ENGLISH_WNUT_2020
33from .sequence_labeling import NER_ENGLISH_WEBPAGES
34from .sequence_labeling import NER_FINNISH
35from .sequence_labeling import NER_GERMAN_BIOFID
36from .sequence_labeling import NER_GERMAN_EUROPARL
37from .sequence_labeling import NER_GERMAN_GERMEVAL
38from .sequence_labeling import NER_GERMAN_LEGAL
39from .sequence_labeling import NER_GERMAN_POLITICS
40from .sequence_labeling import NER_HUNGARIAN
41from .sequence_labeling import NER_ICELANDIC
42from .sequence_labeling import NER_JAPANESE
43from .sequence_labeling import NER_MASAKHANE
44from .sequence_labeling import NER_MULTI_WIKINER
45from .sequence_labeling import NER_MULTI_WIKIANN
46from .sequence_labeling import NER_MULTI_XTREME
47from .sequence_labeling import NER_SWEDISH
48from .sequence_labeling import NER_TURKU
49from .sequence_labeling import MultiCoNer
50# keyphrase detection datasets
51from .sequence_labeling import KEYPHRASE_INSPEC
52from .sequence_labeling import KEYPHRASE_SEMEVAL2010
53from .sequence_labeling import KEYPHRASE_SEMEVAL2017
54# universal proposition banks
55from .sequence_labeling import UP_CHINESE
56from .sequence_labeling import UP_ENGLISH
57from .sequence_labeling import UP_FINNISH
58from .sequence_labeling import UP_FRENCH
59from .sequence_labeling import UP_GERMAN
60from .sequence_labeling import UP_ITALIAN
61from .sequence_labeling import UP_SPANISH
62from .sequence_labeling import UP_SPANISH_ANCORA
64# Expose all entity linking datasets
65from .entity_linking import EntityLinkingCorpus
66from .entity_linking import NEL_ENGLISH_AIDA
67from .entity_linking import NEL_ENGLISH_AQUAINT
68from .entity_linking import NEL_ENGLISH_IITB
69from .entity_linking import NEL_ENGLISH_REDDIT
70from .entity_linking import NEL_ENGLISH_TWEEKI
71from .entity_linking import NEL_GERMAN_HIPE
73# word sense disambiguation
74from .entity_linking import WSD_UFSAC
75from .entity_linking import WSD_RAGANATO_ALL
76from .entity_linking import WSD_SEMCOR
77from .entity_linking import WSD_WORDNET_GLOSS_TAGGED
78from .entity_linking import WSD_MASC
79from .entity_linking import WSD_OMSTI
80from .entity_linking import WSD_TRAINOMATIC
82# Expose all document classification datasets
83from .document_classification import ClassificationCorpus
84from .document_classification import ClassificationDataset
85from .document_classification import CSVClassificationCorpus
86from .document_classification import CSVClassificationDataset
87from .document_classification import AMAZON_REVIEWS
88from .document_classification import COMMUNICATIVE_FUNCTIONS
89from .document_classification import GERMEVAL_2018_OFFENSIVE_LANGUAGE
90from .document_classification import GLUE_COLA
91from .document_classification import GO_EMOTIONS
92from .document_classification import IMDB
93from .document_classification import NEWSGROUPS
94from .document_classification import SENTIMENT_140
95from .document_classification import SENTEVAL_CR
96from .document_classification import SENTEVAL_MR
97from .document_classification import SENTEVAL_MPQA
98from .document_classification import SENTEVAL_SUBJ
99from .document_classification import SENTEVAL_SST_BINARY
100from .document_classification import SENTEVAL_SST_GRANULAR
101from .document_classification import TREC_50
102from .document_classification import TREC_6
103from .document_classification import WASSA_ANGER
104from .document_classification import WASSA_FEAR
105from .document_classification import WASSA_JOY
106from .document_classification import WASSA_SADNESS
107from .document_classification import YAHOO_ANSWERS
109# Expose all treebanks
110from .treebanks import UniversalDependenciesCorpus
111from .treebanks import UniversalDependenciesDataset
112from .treebanks import UD_ARMENIAN
113from .treebanks import UD_ENGLISH
114from .treebanks import UD_ANCIENT_GREEK
115from .treebanks import UD_KAZAKH
116from .treebanks import UD_ESTONIAN
117from .treebanks import UD_GERMAN
118from .treebanks import UD_GERMAN_HDT
119from .treebanks import UD_DUTCH
120from .treebanks import UD_FAROESE
121from .treebanks import UD_FRENCH
122from .treebanks import UD_ITALIAN
123from .treebanks import UD_SPANISH
124from .treebanks import UD_PORTUGUESE
125from .treebanks import UD_ROMANIAN
126from .treebanks import UD_CATALAN
127from .treebanks import UD_POLISH
128from .treebanks import UD_CZECH
129from .treebanks import UD_SLOVAK
130from .treebanks import UD_SWEDISH
131from .treebanks import UD_DANISH
132from .treebanks import UD_NORWEGIAN
133from .treebanks import UD_FINNISH
134from .treebanks import UD_SLOVENIAN
135from .treebanks import UD_CROATIAN
136from .treebanks import UD_SERBIAN
137from .treebanks import UD_BULGARIAN
138from .treebanks import UD_ARABIC
139from .treebanks import UD_HEBREW
140from .treebanks import UD_TURKISH
141from .treebanks import UD_PERSIAN
142from .treebanks import UD_RUSSIAN
143from .treebanks import UD_HINDI
144from .treebanks import UD_INDONESIAN
145from .treebanks import UD_JAPANESE
146from .treebanks import UD_CHINESE
147from .treebanks import UD_KOREAN
148from .treebanks import UD_BASQUE
149from .treebanks import UD_GREEK
150from .treebanks import UD_LIVVI
151from .treebanks import UD_NORTH_SAMI
152from .treebanks import UD_MARATHI
153from .treebanks import UD_MALTESE
154from .treebanks import UD_AFRIKAANS
155from .treebanks import UD_OLD_FRENCH
156from .treebanks import UD_GOTHIC
157from .treebanks import UD_WOLOF
158from .treebanks import UD_BELARUSIAN
159from .treebanks import UD_OLD_CHURCH_SLAVONIC
160from .treebanks import UD_COPTIC
161from .treebanks import UD_IRISH
162from .treebanks import UD_LATVIAN
163from .treebanks import UD_LITHUANIAN
164from .treebanks import UD_GALICIAN
165from .treebanks import UD_LATIN
167# Expose all text-text datasets
168from .text_text import ParallelTextCorpus
169from .text_text import ParallelTextDataset
170from .text_text import OpusParallelCorpus
171from .text_text import DataPairDataset
172from .text_text import DataPairCorpus
173from .text_text import GLUE_MNLI
174from .text_text import GLUE_MRPC
175from .text_text import GLUE_RTE
176from .text_text import GLUE_QNLI
177from .text_text import GLUE_QQP
178from .text_text import GLUE_WNLI
179from .text_text import SUPERGLUE_RTE
181# Expose all text-image datasets
182from .text_image import FeideggerCorpus
183from .text_image import FeideggerDataset
185# Expose all biomedical datasets
186from .biomedical import ANAT_EM
187from .biomedical import AZDZ
188from .biomedical import BIONLP2013_PC
189from .biomedical import BIONLP2013_CG
190from .biomedical import BIO_INFER
191from .biomedical import BIOSEMANTICS
192from .biomedical import BC2GM
193from .biomedical import CELL_FINDER
194from .biomedical import CEMP
195from .biomedical import CDR
196from .biomedical import CHEMDNER
197from .biomedical import CRAFT
198from .biomedical import CRAFT_V4
199from .biomedical import CLL
200from .biomedical import DECA
201from .biomedical import FSU
202from .biomedical import GELLUS
203from .biomedical import GPRO
204from .biomedical import IEPA
205from .biomedical import JNLPBA
206from .biomedical import LOCTEXT
207from .biomedical import LINNEAUS
208from .biomedical import NCBI_DISEASE
209from .biomedical import MIRNA
210from .biomedical import OSIRIS
211from .biomedical import PDR
212from .biomedical import S800
213from .biomedical import SCAI_CHEMICALS
214from .biomedical import SCAI_DISEASE
215from .biomedical import VARIOME
217# Expose all biomedical datasets using the HUNER splits
218from .biomedical import HUNER_CHEMICAL
219from .biomedical import HUNER_CHEMICAL_CHEBI
220from .biomedical import HUNER_CHEMICAL_CHEMDNER
221from .biomedical import HUNER_CHEMICAL_CDR
222from .biomedical import HUNER_CHEMICAL_CEMP
223from .biomedical import HUNER_CHEMICAL_SCAI
224from .biomedical import HUNER_CHEMICAL_CRAFT_V4
225# -
226from .biomedical import HUNER_CELL_LINE
227from .biomedical import HUNER_CELL_LINE_CLL
228from .biomedical import HUNER_CELL_LINE_CELL_FINDER
229from .biomedical import HUNER_CELL_LINE_GELLUS
230from .biomedical import HUNER_CELL_LINE_JNLPBA
231# -
232from .biomedical import HUNER_DISEASE
233from .biomedical import HUNER_DISEASE_CDR
234from .biomedical import HUNER_DISEASE_MIRNA
235from .biomedical import HUNER_DISEASE_NCBI
236from .biomedical import HUNER_DISEASE_SCAI
237from .biomedical import HUNER_DISEASE_VARIOME
238from .biomedical import HUNER_DISEASE_PDR
239# -
240from .biomedical import HUNER_GENE
241from .biomedical import HUNER_GENE_BIO_INFER
242from .biomedical import HUNER_GENE_BC2GM
243from .biomedical import HUNER_GENE_CHEBI
244from .biomedical import HUNER_GENE_CRAFT_V4
245from .biomedical import HUNER_GENE_CELL_FINDER
246from .biomedical import HUNER_GENE_DECA
247from .biomedical import HUNER_GENE_FSU
248from .biomedical import HUNER_GENE_GPRO
249from .biomedical import HUNER_GENE_IEPA
250from .biomedical import HUNER_GENE_JNLPBA
251from .biomedical import HUNER_GENE_LOCTEXT
252from .biomedical import HUNER_GENE_MIRNA
253from .biomedical import HUNER_GENE_OSIRIS
254from .biomedical import HUNER_GENE_VARIOME
255# -
256from .biomedical import HUNER_SPECIES
257from .biomedical import HUNER_SPECIES_CELL_FINDER
258from .biomedical import HUNER_SPECIES_CHEBI
259from .biomedical import HUNER_SPECIES_CRAFT_V4
260from .biomedical import HUNER_SPECIES_LOCTEXT
261from .biomedical import HUNER_SPECIES_LINNEAUS
262from .biomedical import HUNER_SPECIES_MIRNA
263from .biomedical import HUNER_SPECIES_S800
264from .biomedical import HUNER_SPECIES_VARIOME
266# Expose all biomedical datasets used for the evaluation of BioBERT
267from .biomedical import BIOBERT_CHEMICAL_BC4CHEMD
268from .biomedical import BIOBERT_CHEMICAL_BC5CDR
269from .biomedical import BIOBERT_DISEASE_NCBI
270from .biomedical import BIOBERT_DISEASE_BC5CDR
271from .biomedical import BIOBERT_SPECIES_LINNAEUS
272from .biomedical import BIOBERT_SPECIES_S800
273from .biomedical import BIOBERT_GENE_BC2GM
274from .biomedical import BIOBERT_GENE_JNLPBA
276# Expose all relation extraction datasets
277from .relation_extraction import RE_ENGLISH_SEMEVAL2010
278from .relation_extraction import RE_ENGLISH_TACRED
279from .relation_extraction import RE_ENGLISH_CONLL04
280from .relation_extraction import RE_ENGLISH_DRUGPROT