|
324 | 324 | )
|
325 | 325 |
|
326 | 326 | __all__ = [
|
327 |
| - "DataLoader", |
328 |
| - "OcrJsonDataset", |
329 |
| - "SROIE", |
330 |
| - "FlairDatapointDataset", |
331 |
| - "SentenceDataset", |
332 |
| - "MongoDataset", |
333 |
| - "StringDataset", |
334 |
| - "EntityLinkingDictionary", |
335 | 327 | "AGNEWS",
|
| 328 | + "AMAZON_REVIEWS", |
336 | 329 | "ANAT_EM",
|
337 | 330 | "AZDZ",
|
338 | 331 | "BC2GM",
|
339 |
| - "BIO_INFER", |
340 | 332 | "BIOBERT_CHEMICAL_BC4CHEMD",
|
341 | 333 | "BIOBERT_CHEMICAL_BC5CDR",
|
342 | 334 | "BIOBERT_DISEASE_BC5CDR",
|
|
347 | 339 | "BIOBERT_SPECIES_S800",
|
348 | 340 | "BIONLP2013_CG",
|
349 | 341 | "BIONLP2013_PC",
|
| 342 | + "BIOSCOPE", |
350 | 343 | "BIOSEMANTICS",
|
| 344 | + "BIO_INFER", |
351 | 345 | "CDR",
|
352 | 346 | "CELL_FINDER",
|
353 | 347 | "CEMP",
|
354 | 348 | "CHEMDNER",
|
| 349 | + "CLEANCONLL", |
355 | 350 | "CLL",
|
| 351 | + "COMMUNICATIVE_FUNCTIONS", |
| 352 | + "CONLL_03", |
| 353 | + "CONLL_03_DUTCH", |
| 354 | + "CONLL_03_GERMAN", |
| 355 | + "CONLL_03_SPANISH", |
| 356 | + "CONLL_2000", |
356 | 357 | "CRAFT",
|
357 | 358 | "CRAFT_V4",
|
| 359 | + "CTD_CHEMICALS_DICTIONARY", |
| 360 | + "CTD_DISEASES_DICTIONARY", |
358 | 361 | "DECA",
|
| 362 | + "FEWNERD", |
359 | 363 | "FSU",
|
360 | 364 | "GELLUS",
|
| 365 | + "GERMEVAL_2018_OFFENSIVE_LANGUAGE", |
| 366 | + "GLUE_COLA", |
| 367 | + "GLUE_MNLI", |
| 368 | + "GLUE_MRPC", |
| 369 | + "GLUE_QNLI", |
| 370 | + "GLUE_QQP", |
| 371 | + "GLUE_RTE", |
| 372 | + "GLUE_SST2", |
| 373 | + "GLUE_STSB", |
| 374 | + "GLUE_WNLI", |
| 375 | + "GO_EMOTIONS", |
361 | 376 | "GPRO",
|
362 |
| - "HunerEntityLinkingDictionary", |
363 | 377 | "HUNER_CELL_LINE",
|
364 | 378 | "HUNER_CELL_LINE_CELL_FINDER",
|
365 | 379 | "HUNER_CELL_LINE_CLL",
|
|
404 | 418 | "HUNER_SPECIES_S800",
|
405 | 419 | "HUNER_SPECIES_VARIOME",
|
406 | 420 | "IEPA",
|
| 421 | + "IMDB", |
407 | 422 | "JNLPBA",
|
| 423 | + "KEYPHRASE_INSPEC", |
| 424 | + "KEYPHRASE_SEMEVAL2010", |
| 425 | + "KEYPHRASE_SEMEVAL2017", |
408 | 426 | "LINNEAUS",
|
409 | 427 | "LOCTEXT",
|
| 428 | + "MASAKHA_POS", |
410 | 429 | "MIRNA",
|
| 430 | + "NCBI_DISEASE", |
411 | 431 | "NCBI_GENE_HUMAN_DICTIONARY",
|
412 | 432 | "NCBI_TAXONOMY_DICTIONARY",
|
413 |
| - "CTD_DISEASES_DICTIONARY", |
414 |
| - "CTD_CHEMICALS_DICTIONARY", |
415 |
| - "NCBI_DISEASE", |
416 |
| - "ONTONOTES", |
417 |
| - "OSIRIS", |
418 |
| - "PDR", |
419 |
| - "S800", |
420 |
| - "SCAI_CHEMICALS", |
421 |
| - "SCAI_DISEASE", |
422 |
| - "VARIOME", |
423 |
| - "AMAZON_REVIEWS", |
424 |
| - "COMMUNICATIVE_FUNCTIONS", |
425 |
| - "GERMEVAL_2018_OFFENSIVE_LANGUAGE", |
426 |
| - "GLUE_COLA", |
427 |
| - "GO_EMOTIONS", |
428 |
| - "IMDB", |
429 |
| - "NEWSGROUPS", |
430 |
| - "STACKOVERFLOW", |
431 |
| - "SENTEVAL_CR", |
432 |
| - "SENTEVAL_MPQA", |
433 |
| - "SENTEVAL_MR", |
434 |
| - "SENTEVAL_SST_BINARY", |
435 |
| - "SENTEVAL_SST_GRANULAR", |
436 |
| - "SENTEVAL_SUBJ", |
437 |
| - "SENTIMENT_140", |
438 |
| - "TREC_6", |
439 |
| - "TREC_50", |
440 |
| - "WASSA_ANGER", |
441 |
| - "WASSA_FEAR", |
442 |
| - "WASSA_JOY", |
443 |
| - "WASSA_SADNESS", |
444 |
| - "YAHOO_ANSWERS", |
445 |
| - "ClassificationCorpus", |
446 |
| - "ClassificationDataset", |
447 |
| - "CSVClassificationCorpus", |
448 |
| - "CSVClassificationDataset", |
449 | 433 | "NEL_ENGLISH_AIDA",
|
450 | 434 | "NEL_ENGLISH_AQUAINT",
|
451 | 435 | "NEL_ENGLISH_IITB",
|
452 | 436 | "NEL_ENGLISH_REDDIT",
|
453 | 437 | "NEL_ENGLISH_TWEEKI",
|
454 | 438 | "NEL_GERMAN_HIPE",
|
455 |
| - "WSD_MASC", |
456 |
| - "WSD_OMSTI", |
457 |
| - "WSD_RAGANATO_ALL", |
458 |
| - "WSD_SEMCOR", |
459 |
| - "WSD_TRAINOMATIC", |
460 |
| - "WSD_UFSAC", |
461 |
| - "WSD_WORDNET_GLOSS_TAGGED", |
462 |
| - "RE_ENGLISH_CONLL04", |
463 |
| - "RE_ENGLISH_DRUGPROT", |
464 |
| - "RE_ENGLISH_SEMEVAL2010", |
465 |
| - "RE_ENGLISH_TACRED", |
466 |
| - "BIOSCOPE", |
467 |
| - "CONLL_03", |
468 |
| - "CONLL_03_DUTCH", |
469 |
| - "CONLL_03_GERMAN", |
470 |
| - "CONLL_03_SPANISH", |
471 |
| - "CLEANCONLL", |
472 |
| - "CONLL_2000", |
473 |
| - "FEWNERD", |
474 |
| - "KEYPHRASE_INSPEC", |
475 |
| - "KEYPHRASE_SEMEVAL2010", |
476 |
| - "KEYPHRASE_SEMEVAL2017", |
477 |
| - "MASAKHA_POS", |
478 | 439 | "NER_ARABIC_ANER",
|
479 | 440 | "NER_ARABIC_AQMAR",
|
480 | 441 | "NER_BASQUE",
|
|
491 | 452 | "NER_ENGLISH_WEBPAGES",
|
492 | 453 | "NER_ENGLISH_WIKIGOLD",
|
493 | 454 | "NER_ENGLISH_WNUT_2020",
|
| 455 | + "NER_ESTONIAN_NOISY", |
494 | 456 | "NER_FINNISH",
|
495 | 457 | "NER_GERMAN_BIOFID",
|
496 | 458 | "NER_GERMAN_EUROPARL",
|
|
499 | 461 | "NER_GERMAN_MOBIE",
|
500 | 462 | "NER_GERMAN_POLITICS",
|
501 | 463 | "NER_HIPE_2022",
|
502 |
| - "NER_NOISEBENCH", |
503 | 464 | "NER_HUNGARIAN",
|
504 | 465 | "NER_ICDAR_EUROPEANA",
|
505 | 466 | "NER_ICELANDIC",
|
506 | 467 | "NER_JAPANESE",
|
507 |
| - "NER_NERMUD", |
508 | 468 | "NER_MASAKHANE",
|
| 469 | + "NER_MULTI_CONER", |
| 470 | + "NER_MULTI_CONER_V2", |
509 | 471 | "NER_MULTI_WIKIANN",
|
510 | 472 | "NER_MULTI_WIKINER",
|
511 | 473 | "NER_MULTI_XTREME",
|
| 474 | + "NER_NERMUD", |
| 475 | + "NER_NOISEBENCH", |
512 | 476 | "NER_SWEDISH",
|
513 | 477 | "NER_TURKU",
|
514 | 478 | "NER_UKRAINIAN",
|
515 |
| - "NER_ESTONIAN_NOISY", |
516 |
| - "UP_CHINESE", |
517 |
| - "UP_ENGLISH", |
518 |
| - "UP_FINNISH", |
519 |
| - "UP_FRENCH", |
520 |
| - "UP_GERMAN", |
521 |
| - "UP_ITALIAN", |
522 |
| - "UP_SPANISH", |
523 |
| - "UP_SPANISH_ANCORA", |
524 |
| - "WNUT_17", |
525 |
| - "ColumnCorpus", |
526 |
| - "ColumnDataset", |
527 |
| - "NER_MULTI_CONER", |
528 |
| - "NER_MULTI_CONER_V2", |
529 |
| - "FeideggerCorpus", |
530 |
| - "FeideggerDataset", |
531 |
| - "GLUE_MNLI", |
532 |
| - "GLUE_MRPC", |
533 |
| - "GLUE_QNLI", |
534 |
| - "GLUE_QQP", |
535 |
| - "GLUE_RTE", |
536 |
| - "GLUE_WNLI", |
537 |
| - "GLUE_SST2", |
538 |
| - "GLUE_STSB", |
| 479 | + "NEWSGROUPS", |
| 480 | + "ONTONOTES", |
| 481 | + "OSIRIS", |
| 482 | + "PDR", |
| 483 | + "RE_ENGLISH_CONLL04", |
| 484 | + "RE_ENGLISH_DRUGPROT", |
| 485 | + "RE_ENGLISH_SEMEVAL2010", |
| 486 | + "RE_ENGLISH_TACRED", |
| 487 | + "S800", |
| 488 | + "SCAI_CHEMICALS", |
| 489 | + "SCAI_DISEASE", |
| 490 | + "SENTEVAL_CR", |
| 491 | + "SENTEVAL_MPQA", |
| 492 | + "SENTEVAL_MR", |
| 493 | + "SENTEVAL_SST_BINARY", |
| 494 | + "SENTEVAL_SST_GRANULAR", |
| 495 | + "SENTEVAL_SUBJ", |
| 496 | + "SENTIMENT_140", |
| 497 | + "SROIE", |
| 498 | + "STACKOVERFLOW", |
539 | 499 | "SUPERGLUE_RTE",
|
540 |
| - "DataPairCorpus", |
541 |
| - "DataPairDataset", |
542 |
| - "DataTripleCorpus", |
543 |
| - "DataTripleDataset", |
544 |
| - "OpusParallelCorpus", |
545 |
| - "ParallelTextCorpus", |
546 |
| - "ParallelTextDataset", |
| 500 | + "TREC_6", |
| 501 | + "TREC_50", |
547 | 502 | "UD_AFRIKAANS",
|
548 | 503 | "UD_ANCIENT_GREEK",
|
549 | 504 | "UD_ARABIC",
|
|
603 | 558 | "UD_TURKISH",
|
604 | 559 | "UD_UKRAINIAN",
|
605 | 560 | "UD_WOLOF",
|
| 561 | + "UP_CHINESE", |
| 562 | + "UP_ENGLISH", |
| 563 | + "UP_FINNISH", |
| 564 | + "UP_FRENCH", |
| 565 | + "UP_GERMAN", |
| 566 | + "UP_ITALIAN", |
| 567 | + "UP_SPANISH", |
| 568 | + "UP_SPANISH_ANCORA", |
| 569 | + "VARIOME", |
| 570 | + "WASSA_ANGER", |
| 571 | + "WASSA_FEAR", |
| 572 | + "WASSA_JOY", |
| 573 | + "WASSA_SADNESS", |
| 574 | + "WNUT_17", |
| 575 | + "WSD_MASC", |
| 576 | + "WSD_OMSTI", |
| 577 | + "WSD_RAGANATO_ALL", |
| 578 | + "WSD_SEMCOR", |
| 579 | + "WSD_TRAINOMATIC", |
| 580 | + "WSD_UFSAC", |
| 581 | + "WSD_WORDNET_GLOSS_TAGGED", |
| 582 | + "YAHOO_ANSWERS", |
| 583 | + "ZELDA", |
| 584 | + "CSVClassificationCorpus", |
| 585 | + "CSVClassificationDataset", |
| 586 | + "ClassificationCorpus", |
| 587 | + "ClassificationDataset", |
| 588 | + "ColumnCorpus", |
| 589 | + "ColumnDataset", |
| 590 | + "DataLoader", |
| 591 | + "DataPairCorpus", |
| 592 | + "DataPairDataset", |
| 593 | + "DataTripleCorpus", |
| 594 | + "DataTripleDataset", |
| 595 | + "EntityLinkingDictionary", |
| 596 | + "FeideggerCorpus", |
| 597 | + "FeideggerDataset", |
| 598 | + "FlairDatapointDataset", |
| 599 | + "HunerEntityLinkingDictionary", |
| 600 | + "MongoDataset", |
| 601 | + "OcrJsonDataset", |
| 602 | + "OpusParallelCorpus", |
| 603 | + "ParallelTextCorpus", |
| 604 | + "ParallelTextDataset", |
| 605 | + "SentenceDataset", |
| 606 | + "StringDataset", |
606 | 607 | "UniversalDependenciesCorpus",
|
607 | 608 | "UniversalDependenciesDataset",
|
608 |
| - "ZELDA", |
609 | 609 | ]
|
0 commit comments