diff --git a/datasets/acronym_identification/README.md b/datasets/acronym_identification/README.md index a7bc8aa46b3..732633f28ec 100644 --- a/datasets/acronym_identification/README.md +++ b/datasets/acronym_identification/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/ade_corpus_v2/README.md b/datasets/ade_corpus_v2/README.md index b1caa60064c..e90b4d70e64 100644 --- a/datasets/ade_corpus_v2/README.md +++ b/datasets/ade_corpus_v2/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/adv_glue/README.md b/datasets/adv_glue/README.md index 6bd668e6bb0..2a66097bfc9 100644 --- a/datasets/adv_glue/README.md +++ b/datasets/adv_glue/README.md @@ -3,9 +3,9 @@ annotations_creators: - unknown language_creators: - machine-generated -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/adversarial_qa/README.md b/datasets/adversarial_qa/README.md index 7b99d40a802..5ecfe6ed8c0 100644 --- a/datasets/adversarial_qa/README.md +++ b/datasets/adversarial_qa/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/aeslc/README.md b/datasets/aeslc/README.md index 426fa4c71a7..7f46a06dade 100644 --- a/datasets/aeslc/README.md +++ b/datasets/aeslc/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: aeslc pretty_name: AESLC diff --git a/datasets/afrikaans_ner_corpus/README.md b/datasets/afrikaans_ner_corpus/README.md index 44385876c49..f5a8e0fed8d 100644 --- a/datasets/afrikaans_ner_corpus/README.md +++ b/datasets/afrikaans_ner_corpus/README.md @@ -3,9 
+3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - af -licenses: +license: - other-Creative Commons Attribution 2.5 South Africa License multilinguality: - monolingual diff --git a/datasets/ag_news/README.md b/datasets/ag_news/README.md index 4d3536d9f1a..5247129b9ee 100644 --- a/datasets/ag_news/README.md +++ b/datasets/ag_news/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/ai2_arc/README.md b/datasets/ai2_arc/README.md index 7c023456ff1..9b90ff1eebf 100644 --- a/datasets/ai2_arc/README.md +++ b/datasets/ai2_arc/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en-US -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/air_dialogue/README.md b/datasets/air_dialogue/README.md index 112569c12eb..5379775e8e6 100644 --- a/datasets/air_dialogue/README.md +++ b/datasets/air_dialogue/README.md @@ -4,9 +4,9 @@ annotations_creators: - human-annotated language_creators: - machine-generated -languages: +language: - en -licenses: +license: - cc-by-nc-4.0 multilinguality: - monolingual diff --git a/datasets/ajgt_twitter_ar/README.md b/datasets/ajgt_twitter_ar/README.md index 6834bca4b13..a492f418d1b 100644 --- a/datasets/ajgt_twitter_ar/README.md +++ b/datasets/ajgt_twitter_ar/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - ar -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/allegro_reviews/README.md b/datasets/allegro_reviews/README.md index c9f8434335f..cc7f47bd707 100644 --- a/datasets/allegro_reviews/README.md +++ b/datasets/allegro_reviews/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - pl -licenses: +license: - 
cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/allocine/README.md b/datasets/allocine/README.md index 75941954c70..43202104110 100644 --- a/datasets/allocine/README.md +++ b/datasets/allocine/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - fr -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/alt/README.md b/datasets/alt/README.md index f2ce3cc7bab..392e73257b0 100644 --- a/datasets/alt/README.md +++ b/datasets/alt/README.md @@ -3,7 +3,7 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - bn - en - fil @@ -17,7 +17,7 @@ languages: - th - vi - zh -licenses: +license: - cc-by-4.0 multilinguality: - multilingual @@ -89,7 +89,7 @@ Machine Translation, Dependency Parsing ### Languages -It supports 13 languages: +It supports 13 languages: * Bengali * English * Filipino diff --git a/datasets/amazon_polarity/README.md b/datasets/amazon_polarity/README.md index 58d2827b13e..50f30510ff1 100644 --- a/datasets/amazon_polarity/README.md +++ b/datasets/amazon_polarity/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/amazon_reviews_multi/README.md b/datasets/amazon_reviews_multi/README.md index f2b07d2fd1b..50787bd0216 100644 --- a/datasets/amazon_reviews_multi/README.md +++ b/datasets/amazon_reviews_multi/README.md @@ -3,14 +3,14 @@ annotations_creators: - found language_creators: - found -languages: +language: - de - en - es - fr - ja - zh -licenses: +license: - other-amazon-license multilinguality: - monolingual diff --git a/datasets/amazon_us_reviews/README.md b/datasets/amazon_us_reviews/README.md index 55106dccdd7..ce08740c4e4 100644 --- a/datasets/amazon_us_reviews/README.md +++ b/datasets/amazon_us_reviews/README.md @@ -1,5 +1,5 @@ --- -languages: 
+language: - en paperswithcode_id: null pretty_name: AmazonUsReviews diff --git a/datasets/ambig_qa/README.md b/datasets/ambig_qa/README.md index f7b9858ac4b..39505d7f7c4 100644 --- a/datasets/ambig_qa/README.md +++ b/datasets/ambig_qa/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-sa-3.0 multilinguality: - monolingual diff --git a/datasets/americas_nli/README.md b/datasets/americas_nli/README.md index 5dd0c6b8324..de7e980ebff 100644 --- a/datasets/americas_nli/README.md +++ b/datasets/americas_nli/README.md @@ -3,7 +3,7 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - ay - bzd - cni @@ -14,7 +14,7 @@ languages: - qu - shp - tar -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/ami/README.md b/datasets/ami/README.md index 93b1c0cb17d..589de65f084 100644 --- a/datasets/ami/README.md +++ b/datasets/ami/README.md @@ -5,9 +5,9 @@ annotations_creators: language_creators: - crowdsourced - expert-generated -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/amttl/README.md b/datasets/amttl/README.md index 7b5ea22e195..03d7cb2759f 100644 --- a/datasets/amttl/README.md +++ b/datasets/amttl/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - zh -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/anli/README.md b/datasets/anli/README.md index 310e20c3b8a..50dee3014a6 100644 --- a/datasets/anli/README.md +++ b/datasets/anli/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: anli pretty_name: Adversarial NLI diff --git a/datasets/app_reviews/README.md b/datasets/app_reviews/README.md index ba80ecc6439..7f1bb01602f 100644 --- a/datasets/app_reviews/README.md +++ b/datasets/app_reviews/README.md @@ -3,9 +3,9 @@ 
annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/aqua_rat/README.md b/datasets/aqua_rat/README.md index aadd65294d8..ba3c934b9c2 100644 --- a/datasets/aqua_rat/README.md +++ b/datasets/aqua_rat/README.md @@ -4,9 +4,9 @@ annotations_creators: language_creators: - crowdsourced - expert-generated -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/aquamuse/README.md b/datasets/aquamuse/README.md index 745e1bb6704..7581488be3f 100644 --- a/datasets/aquamuse/README.md +++ b/datasets/aquamuse/README.md @@ -5,9 +5,9 @@ annotations_creators: language_creators: - crowdsourced - expert-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/ar_cov19/README.md b/datasets/ar_cov19/README.md index 6877143b1af..bfbcb7a4827 100644 --- a/datasets/ar_cov19/README.md +++ b/datasets/ar_cov19/README.md @@ -3,7 +3,7 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - ar multilinguality: - monolingual diff --git a/datasets/ar_res_reviews/README.md b/datasets/ar_res_reviews/README.md index 0437be0b4ce..803bb12b6b6 100644 --- a/datasets/ar_res_reviews/README.md +++ b/datasets/ar_res_reviews/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - ar -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/ar_sarcasm/README.md b/datasets/ar_sarcasm/README.md index 7c60ea2bebc..bce44183d49 100644 --- a/datasets/ar_sarcasm/README.md +++ b/datasets/ar_sarcasm/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - ar -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/arabic_billion_words/README.md 
b/datasets/arabic_billion_words/README.md index b5e1908801e..89d8e307049 100644 --- a/datasets/arabic_billion_words/README.md +++ b/datasets/arabic_billion_words/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - ar -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/arabic_pos_dialect/README.md b/datasets/arabic_pos_dialect/README.md index e6632488cc3..59f804ae169 100644 --- a/datasets/arabic_pos_dialect/README.md +++ b/datasets/arabic_pos_dialect/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - ar -licenses: +license: - apache-2.0 multilinguality: - multilingual diff --git a/datasets/arabic_speech_corpus/README.md b/datasets/arabic_speech_corpus/README.md index f8af29e95f5..7e93a15f8fc 100644 --- a/datasets/arabic_speech_corpus/README.md +++ b/datasets/arabic_speech_corpus/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - ar -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/arcd/README.md b/datasets/arcd/README.md index 9adadff2d9b..272a64db526 100644 --- a/datasets/arcd/README.md +++ b/datasets/arcd/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - ar-SA -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/arsentd_lev/README.md b/datasets/arsentd_lev/README.md index 5be2b1601a4..7fa01a928ab 100644 --- a/datasets/arsentd_lev/README.md +++ b/datasets/arsentd_lev/README.md @@ -3,10 +3,10 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - apc - apj -licenses: +license: - other-Copyright-2018-by-[American-University-of-Beirut] multilinguality: - monolingual diff --git a/datasets/art/README.md b/datasets/art/README.md index 38aba38e4b7..16eb26d0b7c 100644 --- 
a/datasets/art/README.md +++ b/datasets/art/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: art-dataset pretty_name: Abductive Reasoning in narrative Text diff --git a/datasets/arxiv_dataset/README.md b/datasets/arxiv_dataset/README.md index 6793e480e05..7e12f7673d5 100644 --- a/datasets/arxiv_dataset/README.md +++ b/datasets/arxiv_dataset/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - expert-generated -languages: +language: - en -licenses: +license: - cc0-1.0 multilinguality: - monolingual diff --git a/datasets/ascent_kb/README.md b/datasets/ascent_kb/README.md index 3120c71df25..dbccfb01572 100644 --- a/datasets/ascent_kb/README.md +++ b/datasets/ascent_kb/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/aslg_pc12/README.md b/datasets/aslg_pc12/README.md index a26c4154dcd..b20189c9785 100644 --- a/datasets/aslg_pc12/README.md +++ b/datasets/aslg_pc12/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: aslg-pc12 pretty_name: English-ASL Gloss Parallel Corpus 2012 diff --git a/datasets/asnq/README.md b/datasets/asnq/README.md index f3e9425aa68..ac5ae1b2e41 100644 --- a/datasets/asnq/README.md +++ b/datasets/asnq/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: asnq pretty_name: Answer Sentence Natural Questions diff --git a/datasets/asset/README.md b/datasets/asset/README.md index 90469494cc4..e871def97a6 100644 --- a/datasets/asset/README.md +++ b/datasets/asset/README.md @@ -3,9 +3,9 @@ annotations_creators: - machine-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/assin/README.md b/datasets/assin/README.md index 3717b499871..183e2efc248 100644 --- a/datasets/assin/README.md +++ 
b/datasets/assin/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - pt -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/assin2/README.md b/datasets/assin2/README.md index 9bf5e2c309a..b47c2530fa1 100644 --- a/datasets/assin2/README.md +++ b/datasets/assin2/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - pt -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/atomic/README.md b/datasets/atomic/README.md index 903354a606f..cc1236db99b 100755 --- a/datasets/atomic/README.md +++ b/datasets/atomic/README.md @@ -4,9 +4,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/autshumato/README.md b/datasets/autshumato/README.md index 64893356a5f..d52273862a3 100644 --- a/datasets/autshumato/README.md +++ b/datasets/autshumato/README.md @@ -3,12 +3,12 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en - tn - ts - zu -licenses: +license: - cc-by-2.5 multilinguality: - multilingual diff --git a/datasets/babi_qa/README.md b/datasets/babi_qa/README.md index 25bfe4f4692..9f5997ba30a 100644 --- a/datasets/babi_qa/README.md +++ b/datasets/babi_qa/README.md @@ -4,9 +4,9 @@ annotations_creators: - machine-generated language_creators: - machine-generated -languages: +language: - en -licenses: +license: - cc-by-3.0 multilinguality: - monolingual diff --git a/datasets/banking77/README.md b/datasets/banking77/README.md index e64eec6ef72..59781bb5210 100644 --- a/datasets/banking77/README.md +++ b/datasets/banking77/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - 
monolingual diff --git a/datasets/bbaw_egyptian/README.md b/datasets/bbaw_egyptian/README.md index 93f6f6b4b76..136b154f26f 100644 --- a/datasets/bbaw_egyptian/README.md +++ b/datasets/bbaw_egyptian/README.md @@ -3,11 +3,11 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - de - en - egy -licenses: +license: - cc-by-4.0 multilinguality: - multilingual diff --git a/datasets/bbc_hindi_nli/README.md b/datasets/bbc_hindi_nli/README.md index 0bf0320a058..7aba13aa16e 100644 --- a/datasets/bbc_hindi_nli/README.md +++ b/datasets/bbc_hindi_nli/README.md @@ -3,9 +3,9 @@ annotations_creators: - machine-generated language_creators: - found -languages: +language: - hi -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/bc2gm_corpus/README.md b/datasets/bc2gm_corpus/README.md index 64da0edcea9..c84add02067 100644 --- a/datasets/bc2gm_corpus/README.md +++ b/datasets/bc2gm_corpus/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/beans/README.md b/datasets/beans/README.md index 317827a551a..e0bfd0b9ffd 100644 --- a/datasets/beans/README.md +++ b/datasets/beans/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/best2009/README.md b/datasets/best2009/README.md index 5bf4362e31d..7d696e347bf 100644 --- a/datasets/best2009/README.md +++ b/datasets/best2009/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - th -licenses: +license: - cc-by-nc-sa-3.0 multilinguality: - monolingual diff --git a/datasets/bianet/README.md b/datasets/bianet/README.md index f4835b2776c..328a1d5ce0f 100644 --- a/datasets/bianet/README.md +++ 
b/datasets/bianet/README.md @@ -3,11 +3,11 @@ annotations_creators: - found language_creators: - found -languages: +language: - en - ku - tr -licenses: +license: - unknown multilinguality: - translation diff --git a/datasets/bible_para/README.md b/datasets/bible_para/README.md index 8fa40fdf31f..f301303ee77 100644 --- a/datasets/bible_para/README.md +++ b/datasets/bible_para/README.md @@ -3,7 +3,7 @@ annotations_creators: - found language_creators: - found -languages: +language: - acu - af - agr @@ -106,7 +106,7 @@ languages: - xh - zh - zu -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/big_patent/README.md b/datasets/big_patent/README.md index 7aa72347dc7..94a4a66c991 100644 --- a/datasets/big_patent/README.md +++ b/datasets/big_patent/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/bigbench/README.md b/datasets/bigbench/README.md index a86ba85daa9..487b37eab97 100644 --- a/datasets/bigbench/README.md +++ b/datasets/bigbench/README.md @@ -8,9 +8,9 @@ language_creators: - expert-generated - machine-generated - other -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - multilingual diff --git a/datasets/billsum/README.md b/datasets/billsum/README.md index f1b250f7a9b..e6472045c40 100644 --- a/datasets/billsum/README.md +++ b/datasets/billsum/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/bing_coronavirus_query_set/README.md b/datasets/bing_coronavirus_query_set/README.md index f96ae1ae61d..b06bd3ae5a9 100644 --- a/datasets/bing_coronavirus_query_set/README.md +++ b/datasets/bing_coronavirus_query_set/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: 
+language: - en -licenses: +license: - o-uda-1.0 multilinguality: - monolingual diff --git a/datasets/biomrc/README.md b/datasets/biomrc/README.md index b3ac67556bb..d67639ca352 100644 --- a/datasets/biomrc/README.md +++ b/datasets/biomrc/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: biomrc pretty_name: BIOMRC diff --git a/datasets/biosses/README.md b/datasets/biosses/README.md index 6e6b75ab5ab..c6192ad9129 100644 --- a/datasets/biosses/README.md +++ b/datasets/biosses/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - gpl-3.0 multilinguality: - monolingual diff --git a/datasets/biwi_kinect_head_pose/README.md b/datasets/biwi_kinect_head_pose/README.md index d379d637f60..c1610dda072 100644 --- a/datasets/biwi_kinect_head_pose/README.md +++ b/datasets/biwi_kinect_head_pose/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - other multilinguality: - monolingual diff --git a/datasets/blbooks/README.md b/datasets/blbooks/README.md index 1969d2604da..62965f39be6 100644 --- a/datasets/blbooks/README.md +++ b/datasets/blbooks/README.md @@ -3,14 +3,14 @@ annotations_creators: - no-annotation language_creators: - machine-generated -languages: +language: - en - fr - de - es - it - nl -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/blbooksgenre/README.md b/datasets/blbooksgenre/README.md index 542c6a61327..3e6b4517777 100644 --- a/datasets/blbooksgenre/README.md +++ b/datasets/blbooksgenre/README.md @@ -4,12 +4,12 @@ annotations_creators: language_creators: - crowdsourced - expert-generated -languages: +language: - en - de - fr - nl -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/blended_skill_talk/README.md b/datasets/blended_skill_talk/README.md index 149a8586ca0..62c860a1ae5 
100644 --- a/datasets/blended_skill_talk/README.md +++ b/datasets/blended_skill_talk/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/blimp/README.md b/datasets/blimp/README.md index c7994bfa4ca..1d0b9f719b9 100644 --- a/datasets/blimp/README.md +++ b/datasets/blimp/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - machine-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/blog_authorship_corpus/README.md b/datasets/blog_authorship_corpus/README.md index cc2761da851..2188c1e817b 100644 --- a/datasets/blog_authorship_corpus/README.md +++ b/datasets/blog_authorship_corpus/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/bn_hate_speech/README.md b/datasets/bn_hate_speech/README.md index 63333370fb9..4cf5281aac1 100644 --- a/datasets/bn_hate_speech/README.md +++ b/datasets/bn_hate_speech/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - bn -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/bnl_newspapers/README.md b/datasets/bnl_newspapers/README.md index 9cbfac740ff..f6eba35d412 100644 --- a/datasets/bnl_newspapers/README.md +++ b/datasets/bnl_newspapers/README.md @@ -3,7 +3,7 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - ar - da - de @@ -12,7 +12,7 @@ languages: - lb - nl - pt -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/bookcorpus/README.md b/datasets/bookcorpus/README.md index 8a01baa7cb3..322f3d52a04 100644 --- a/datasets/bookcorpus/README.md +++ 
b/datasets/bookcorpus/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/bookcorpusopen/README.md b/datasets/bookcorpusopen/README.md index d28dc98854d..3f7c692410f 100644 --- a/datasets/bookcorpusopen/README.md +++ b/datasets/bookcorpusopen/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/boolq/README.md b/datasets/boolq/README.md index 3bb907991ec..d7deae1b395 100644 --- a/datasets/boolq/README.md +++ b/datasets/boolq/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: boolq pretty_name: Boolean Questions diff --git a/datasets/bprec/README.md b/datasets/bprec/README.md index 8d3e02c18c9..af31a837fb8 100644 --- a/datasets/bprec/README.md +++ b/datasets/bprec/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - pl -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/break_data/README.md b/datasets/break_data/README.md index 5508800a077..264934e3979 100644 --- a/datasets/break_data/README.md +++ b/datasets/break_data/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: break pretty_name: BREAK diff --git a/datasets/brwac/README.md b/datasets/brwac/README.md index 3cc4bd102b0..33e1632cced 100644 --- a/datasets/brwac/README.md +++ b/datasets/brwac/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - pt -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/bsd_ja_en/README.md b/datasets/bsd_ja_en/README.md index 87c1aa85b3a..50b2b7a8dc5 100644 --- a/datasets/bsd_ja_en/README.md +++ b/datasets/bsd_ja_en/README.md @@ -3,10 
+3,10 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en - ja -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - translation diff --git a/datasets/bswac/README.md b/datasets/bswac/README.md index 50799d45658..e282d51bc00 100644 --- a/datasets/bswac/README.md +++ b/datasets/bswac/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - bs -licenses: +license: - cc-by-sa-3.0 multilinguality: - monolingual diff --git a/datasets/c3/README.md b/datasets/c3/README.md index add31753f1d..e4b5b787c8b 100644 --- a/datasets/c3/README.md +++ b/datasets/c3/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - zh -licenses: +license: - other-non-commercial-research multilinguality: - monolingual diff --git a/datasets/c4/README.md b/datasets/c4/README.md index d41d3a25613..fa8b9d8448b 100644 --- a/datasets/c4/README.md +++ b/datasets/c4/README.md @@ -4,9 +4,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - odc-by-1.0 multilinguality: - multilingual diff --git a/datasets/cail2018/README.md b/datasets/cail2018/README.md index f232155e1f7..0a3a3a7f610 100644 --- a/datasets/cail2018/README.md +++ b/datasets/cail2018/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - zh -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/caner/README.md b/datasets/caner/README.md index 0ef84bbf9f9..acba27c6aaf 100644 --- a/datasets/caner/README.md +++ b/datasets/caner/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - ar -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/capes/README.md b/datasets/capes/README.md index 
edf195bc9e7..5807df157c5 100644 --- a/datasets/capes/README.md +++ b/datasets/capes/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - en - pt -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/casino/README.md b/datasets/casino/README.md index 7dea40d28ee..eb54d8678f8 100644 --- a/datasets/casino/README.md +++ b/datasets/casino/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/catalonia_independence/README.md b/datasets/catalonia_independence/README.md index d05394e46cf..3268619bcd4 100644 --- a/datasets/catalonia_independence/README.md +++ b/datasets/catalonia_independence/README.md @@ -3,10 +3,10 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - ca - es -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/cats_vs_dogs/README.md b/datasets/cats_vs_dogs/README.md index e4bd4ee46b8..37c229bf455 100644 --- a/datasets/cats_vs_dogs/README.md +++ b/datasets/cats_vs_dogs/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/cawac/README.md b/datasets/cawac/README.md index 211f4170e2f..29e6e42cb59 100644 --- a/datasets/cawac/README.md +++ b/datasets/cawac/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - ca -licenses: +license: - cc-by-sa-3.0 multilinguality: - monolingual diff --git a/datasets/cbt/README.md b/datasets/cbt/README.md index 9f7f8a98130..74de2a2799c 100644 --- a/datasets/cbt/README.md +++ b/datasets/cbt/README.md @@ -4,9 +4,9 @@ annotations_creators: - machine-generated language_creators: - found 
-languages: +language: - en -licenses: +license: - gfdl-1.3 multilinguality: - monolingual diff --git a/datasets/cc100/README.md b/datasets/cc100/README.md index 39a9807b1d9..eadd1504d6b 100644 --- a/datasets/cc100/README.md +++ b/datasets/cc100/README.md @@ -3,7 +3,7 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - af - am - ar @@ -120,7 +120,7 @@ languages: - zh-Hans - zh-Hant - zu -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/cc_news/README.md b/datasets/cc_news/README.md index e0fe8568744..e49cf585923 100644 --- a/datasets/cc_news/README.md +++ b/datasets/cc_news/README.md @@ -4,9 +4,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/ccaligned_multilingual/README.md b/datasets/ccaligned_multilingual/README.md index 3b116ab339c..46f6944692b 100644 --- a/datasets/ccaligned_multilingual/README.md +++ b/datasets/ccaligned_multilingual/README.md @@ -3,7 +3,7 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - af - ak - am @@ -132,7 +132,7 @@ languages: - zh - zu - zza -licenses: +license: - unknown multilinguality: - translation diff --git a/datasets/cdsc/README.md b/datasets/cdsc/README.md index d2835629389..c4c6daef36d 100644 --- a/datasets/cdsc/README.md +++ b/datasets/cdsc/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - other -languages: +language: - pl -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/cdt/README.md b/datasets/cdt/README.md index 30b10b7d644..6d690fb6279 100644 --- a/datasets/cdt/README.md +++ b/datasets/cdt/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - other -languages: +language: - pl -licenses: +license: - bsd-3-clause multilinguality: - monolingual diff --git 
a/datasets/cedr/README.md b/datasets/cedr/README.md index eb4d3921ea9..f118414673a 100644 --- a/datasets/cedr/README.md +++ b/datasets/cedr/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - ru -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/cfq/README.md b/datasets/cfq/README.md index 40faba5311f..5bc38ea37fb 100644 --- a/datasets/cfq/README.md +++ b/datasets/cfq/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: cfq pretty_name: Compositional Freebase Questions diff --git a/datasets/chr_en/README.md b/datasets/chr_en/README.md index da4d0dcabe5..f46a25642e9 100644 --- a/datasets/chr_en/README.md +++ b/datasets/chr_en/README.md @@ -5,10 +5,10 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - chr - en -licenses: +license: - other-different-license-per-source multilinguality: - monolingual diff --git a/datasets/cifar10/README.md b/datasets/cifar10/README.md index ce97aaa0cba..7195b6f15ae 100644 --- a/datasets/cifar10/README.md +++ b/datasets/cifar10/README.md @@ -4,9 +4,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/cifar100/README.md b/datasets/cifar100/README.md index 3ab94875a23..c716bcdeb48 100644 --- a/datasets/cifar100/README.md +++ b/datasets/cifar100/README.md @@ -4,9 +4,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/circa/README.md b/datasets/circa/README.md index c23333fb05f..bff810ad017 100644 --- a/datasets/circa/README.md +++ b/datasets/circa/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - 
monolingual diff --git a/datasets/civil_comments/README.md b/datasets/civil_comments/README.md index 1d1eda577fd..e2acf85a1f0 100644 --- a/datasets/civil_comments/README.md +++ b/datasets/civil_comments/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: null pretty_name: CivilComments diff --git a/datasets/clickbait_news_bg/README.md b/datasets/clickbait_news_bg/README.md index 7dbd6237006..c15bcdc27bc 100644 --- a/datasets/clickbait_news_bg/README.md +++ b/datasets/clickbait_news_bg/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - bg -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/climate_fever/README.md b/datasets/climate_fever/README.md index c03247e3bf8..4feedaf281f 100644 --- a/datasets/climate_fever/README.md +++ b/datasets/climate_fever/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/clinc_oos/README.md b/datasets/clinc_oos/README.md index b0870c444c8..0849ee858b8 100644 --- a/datasets/clinc_oos/README.md +++ b/datasets/clinc_oos/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-3.0 multilinguality: - monolingual diff --git a/datasets/cmrc2018/README.md b/datasets/cmrc2018/README.md index c93aa99fde3..00cf2a6da9f 100644 --- a/datasets/cmrc2018/README.md +++ b/datasets/cmrc2018/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - zh -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/cmu_hinglish_dog/README.md b/datasets/cmu_hinglish_dog/README.md index 607477ccd8e..69ede2db171 100644 --- a/datasets/cmu_hinglish_dog/README.md +++ 
b/datasets/cmu_hinglish_dog/README.md @@ -3,10 +3,10 @@ annotations_creators: - machine-generated language_creators: - crowdsourced -languages: +language: - en - hi -licenses: +license: - cc-by-sa-3.0 - gfdl-1.3-or-later multilinguality: diff --git a/datasets/cnn_dailymail/README.md b/datasets/cnn_dailymail/README.md index 183ac47c0f0..f2c4b56f0fb 100644 --- a/datasets/cnn_dailymail/README.md +++ b/datasets/cnn_dailymail/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/coached_conv_pref/README.md b/datasets/coached_conv_pref/README.md index e0a380103a5..26d54166f89 100644 --- a/datasets/coached_conv_pref/README.md +++ b/datasets/coached_conv_pref/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/codah/README.md b/datasets/codah/README.md index d96c116a09e..8d9ec85d09e 100644 --- a/datasets/codah/README.md +++ b/datasets/codah/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/code_search_net/README.md b/datasets/code_search_net/README.md index 566844ade9c..c64641ef7ee 100644 --- a/datasets/code_search_net/README.md +++ b/datasets/code_search_net/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - machine-generated -languages: +language: - code -licenses: +license: - other-several-licenses multilinguality: - multilingual diff --git a/datasets/code_x_glue_cc_clone_detection_big_clone_bench/README.md b/datasets/code_x_glue_cc_clone_detection_big_clone_bench/README.md index 405762d0087..9fa791a79d3 100644 --- 
a/datasets/code_x_glue_cc_clone_detection_big_clone_bench/README.md +++ b/datasets/code_x_glue_cc_clone_detection_big_clone_bench/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_clone_detection_poj104/README.md b/datasets/code_x_glue_cc_clone_detection_poj104/README.md index fbd551d257a..217052eb8b6 100644 --- a/datasets/code_x_glue_cc_clone_detection_poj104/README.md +++ b/datasets/code_x_glue_cc_clone_detection_poj104/README.md @@ -4,9 +4,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_cloze_testing_all/README.md b/datasets/code_x_glue_cc_cloze_testing_all/README.md index 272f12b738a..7de66bcc664 100644 --- a/datasets/code_x_glue_cc_cloze_testing_all/README.md +++ b/datasets/code_x_glue_cc_cloze_testing_all/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md b/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md index 013f704c403..ee87b70ac69 100644 --- a/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md +++ b/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_code_completion_line/README.md b/datasets/code_x_glue_cc_code_completion_line/README.md index af147e16727..3ddbc9fe011 100644 --- a/datasets/code_x_glue_cc_code_completion_line/README.md +++ b/datasets/code_x_glue_cc_code_completion_line/README.md @@ -3,9 +3,9 @@ annotations_creators: - found 
language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_code_completion_token/README.md b/datasets/code_x_glue_cc_code_completion_token/README.md index 80eaecb5c78..df58bfe2fdf 100644 --- a/datasets/code_x_glue_cc_code_completion_token/README.md +++ b/datasets/code_x_glue_cc_code_completion_token/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - monolingual diff --git a/datasets/code_x_glue_cc_code_refinement/README.md b/datasets/code_x_glue_cc_code_refinement/README.md index cd8c8999a2f..041ecb42186 100644 --- a/datasets/code_x_glue_cc_code_refinement/README.md +++ b/datasets/code_x_glue_cc_code_refinement/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git a/datasets/code_x_glue_cc_code_to_code_trans/README.md b/datasets/code_x_glue_cc_code_to_code_trans/README.md index f4ae60a8c93..ca97bb122e8 100644 --- a/datasets/code_x_glue_cc_code_to_code_trans/README.md +++ b/datasets/code_x_glue_cc_code_to_code_trans/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git a/datasets/code_x_glue_cc_defect_detection/README.md b/datasets/code_x_glue_cc_defect_detection/README.md index 40d6e13c59e..f1741fcef86 100644 --- a/datasets/code_x_glue_cc_defect_detection/README.md +++ b/datasets/code_x_glue_cc_defect_detection/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - code -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git 
a/datasets/code_x_glue_ct_code_to_text/README.md b/datasets/code_x_glue_ct_code_to_text/README.md index f3a5a833731..e9fd3d769f0 100644 --- a/datasets/code_x_glue_ct_code_to_text/README.md +++ b/datasets/code_x_glue_ct_code_to_text/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - code - en -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git a/datasets/code_x_glue_tc_nl_code_search_adv/README.md b/datasets/code_x_glue_tc_nl_code_search_adv/README.md index 12b83873b67..42f7fa17fd7 100644 --- a/datasets/code_x_glue_tc_nl_code_search_adv/README.md +++ b/datasets/code_x_glue_tc_nl_code_search_adv/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - code - en -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git a/datasets/code_x_glue_tc_text_to_code/README.md b/datasets/code_x_glue_tc_text_to_code/README.md index 51070edac0b..ba3a399f24c 100644 --- a/datasets/code_x_glue_tc_text_to_code/README.md +++ b/datasets/code_x_glue_tc_text_to_code/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - en - code -licenses: +license: - other-C-UDA multilinguality: - other-programming-languages diff --git a/datasets/code_x_glue_tt_text_to_text/README.md b/datasets/code_x_glue_tt_text_to_text/README.md index 0761a65b925..b9e55610472 100644 --- a/datasets/code_x_glue_tt_text_to_text/README.md +++ b/datasets/code_x_glue_tt_text_to_text/README.md @@ -3,13 +3,13 @@ annotations_creators: - found language_creators: - found -languages: +language: - da - nb - lv - zh - en -licenses: +license: - other-C-UDA multilinguality: - multilingual diff --git a/datasets/com_qa/README.md b/datasets/com_qa/README.md index 54604474385..913ec691bfe 100644 --- a/datasets/com_qa/README.md +++ b/datasets/com_qa/README.md @@ -1,5 +1,5 @@ --- -languages: 
+language: - en paperswithcode_id: comqa pretty_name: ComQA diff --git a/datasets/common_gen/README.md b/datasets/common_gen/README.md index 136c5c9a290..25791b2c0cb 100644 --- a/datasets/common_gen/README.md +++ b/datasets/common_gen/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: commongen pretty_name: CommonGen diff --git a/datasets/common_language/README.md b/datasets/common_language/README.md index 522b881ffcc..a7570e878d6 100644 --- a/datasets/common_language/README.md +++ b/datasets/common_language/README.md @@ -4,7 +4,7 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - ar - br - ca @@ -50,7 +50,7 @@ languages: - zh-CN - zh-HK - zh-TW -licenses: +license: - cc-by-4.0 multilinguality: - multilingual diff --git a/datasets/common_voice/README.md b/datasets/common_voice/README.md index 3767cbea29e..0828485e726 100644 --- a/datasets/common_voice/README.md +++ b/datasets/common_voice/README.md @@ -4,7 +4,7 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - ab - ar - as @@ -65,7 +65,7 @@ languages: - zh-CN - zh-HK - zh-TW -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/commonsense_qa/README.md b/datasets/commonsense_qa/README.md index dc8a8dbee97..5c04751c863 100644 --- a/datasets/commonsense_qa/README.md +++ b/datasets/commonsense_qa/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/competition_math/README.md b/datasets/competition_math/README.md index 09a8a567fba..7992e50011f 100644 --- a/datasets/competition_math/README.md +++ b/datasets/competition_math/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff 
--git a/datasets/conceptnet5/README.md b/datasets/conceptnet5/README.md index feb5f12be8b..db93f4e84dd 100755 --- a/datasets/conceptnet5/README.md +++ b/datasets/conceptnet5/README.md @@ -4,7 +4,7 @@ annotations_creators: language_creators: - crowdsourced - found -languages: +language: - de - en - es @@ -15,7 +15,7 @@ languages: - pt - ru - zh -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/conceptual_12m/README.md b/datasets/conceptual_12m/README.md index 9ee6012cc21..f4e22fa3530 100644 --- a/datasets/conceptual_12m/README.md +++ b/datasets/conceptual_12m/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - other multilinguality: - monolingual diff --git a/datasets/conceptual_captions/README.md b/datasets/conceptual_captions/README.md index 07b600a0e5b..4609f9bcf65 100644 --- a/datasets/conceptual_captions/README.md +++ b/datasets/conceptual_captions/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - other multilinguality: - monolingual diff --git a/datasets/conll2000/README.md b/datasets/conll2000/README.md index 3b108bff8ee..d2e0832abc6 100644 --- a/datasets/conll2000/README.md +++ b/datasets/conll2000/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: conll-2000-1 pretty_name: CoNLL-2000 diff --git a/datasets/conll2002/README.md b/datasets/conll2002/README.md index 2d1b8375bf0..b75e7f27dcb 100644 --- a/datasets/conll2002/README.md +++ b/datasets/conll2002/README.md @@ -3,10 +3,10 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - es - nl -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/conll2003/README.md b/datasets/conll2003/README.md index a3cf70124e7..077e32bac6a 100644 --- a/datasets/conll2003/README.md +++ b/datasets/conll2003/README.md @@ -3,9 +3,9 @@ 
annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - other multilinguality: - monolingual diff --git a/datasets/conll2012_ontonotesv5/README.md b/datasets/conll2012_ontonotesv5/README.md index 9851f7e347e..393a417f231 100644 --- a/datasets/conll2012_ontonotesv5/README.md +++ b/datasets/conll2012_ontonotesv5/README.md @@ -3,11 +3,11 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - ar - en - zh -licenses: +license: - cc-by-nc-nd-4.0 multilinguality: - multilingual diff --git a/datasets/conllpp/README.md b/datasets/conllpp/README.md index a8c36aa5ce2..4c59fe19848 100644 --- a/datasets/conllpp/README.md +++ b/datasets/conllpp/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/consumer-finance-complaints/README.md b/datasets/consumer-finance-complaints/README.md index 85b7ba0563d..3dfa010c6a4 100644 --- a/datasets/consumer-finance-complaints/README.md +++ b/datasets/consumer-finance-complaints/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - upl-1.0 multilinguality: - monolingual diff --git a/datasets/conv_ai/README.md b/datasets/conv_ai/README.md index 69825916cc7..9fb288255cc 100644 --- a/datasets/conv_ai/README.md +++ b/datasets/conv_ai/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/conv_ai_2/README.md b/datasets/conv_ai_2/README.md index d6f779a2369..977fdeac8c4 100644 --- a/datasets/conv_ai_2/README.md +++ b/datasets/conv_ai_2/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en 
-licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/conv_ai_3/README.md b/datasets/conv_ai_3/README.md index b1fbf425c27..fe6a5145775 100644 --- a/datasets/conv_ai_3/README.md +++ b/datasets/conv_ai_3/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/conv_questions/README.md b/datasets/conv_questions/README.md index 690f244486d..cfd2f9894c5 100644 --- a/datasets/conv_questions/README.md +++ b/datasets/conv_questions/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en-US -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/coqa/README.md b/datasets/coqa/README.md index 4e5a366fb84..3afb3e66e62 100644 --- a/datasets/coqa/README.md +++ b/datasets/coqa/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: coqa pretty_name: Conversational Question Answering Challenge diff --git a/datasets/cord19/README.md b/datasets/cord19/README.md index 40d53fdfa1b..f2e82f3180a 100644 --- a/datasets/cord19/README.md +++ b/datasets/cord19/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-sa-2.0 - cc-by-nc-2.0 - cc-by-nd-2.0 diff --git a/datasets/cornell_movie_dialog/README.md b/datasets/cornell_movie_dialog/README.md index fc28c7a6bc8..c6f4b5b76ff 100644 --- a/datasets/cornell_movie_dialog/README.md +++ b/datasets/cornell_movie_dialog/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: cornell-movie-dialogs-corpus pretty_name: Cornell Movie-Dialogs Corpus diff --git a/datasets/cos_e/README.md b/datasets/cos_e/README.md index d9cb2c3264b..962ddeef647 100644 --- a/datasets/cos_e/README.md +++ b/datasets/cos_e/README.md @@ -1,5 +1,5 @@ --- -languages: 
+language: - en paperswithcode_id: cos-e pretty_name: Commonsense Explanations Dataset diff --git a/datasets/cosmos_qa/README.md b/datasets/cosmos_qa/README.md index ee6708c37ce..79318f01612 100644 --- a/datasets/cosmos_qa/README.md +++ b/datasets/cosmos_qa/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: cosmosqa pretty_name: CosmosQA diff --git a/datasets/counter/README.md b/datasets/counter/README.md index a7e18fe1c2e..91cae1b54c4 100644 --- a/datasets/counter/README.md +++ b/datasets/counter/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - ur -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/covid_qa_castorini/README.md b/datasets/covid_qa_castorini/README.md index 820f375ad66..045852b8f4d 100644 --- a/datasets/covid_qa_castorini/README.md +++ b/datasets/covid_qa_castorini/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/covid_qa_deepset/README.md b/datasets/covid_qa_deepset/README.md index e97be81ab4b..f66daeca2a4 100644 --- a/datasets/covid_qa_deepset/README.md +++ b/datasets/covid_qa_deepset/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/covid_qa_ucsd/README.md b/datasets/covid_qa_ucsd/README.md index 0d7b19e0807..54beb832085 100644 --- a/datasets/covid_qa_ucsd/README.md +++ b/datasets/covid_qa_ucsd/README.md @@ -4,10 +4,10 @@ annotations_creators: language_creators: - expert-generated - found -languages: +language: - en - zh -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/covid_tweets_japanese/README.md b/datasets/covid_tweets_japanese/README.md index 
04ea234616a..4e709aedcc4 100644 --- a/datasets/covid_tweets_japanese/README.md +++ b/datasets/covid_tweets_japanese/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - ja -licenses: +license: - cc-by-nd-4.0 multilinguality: - monolingual diff --git a/datasets/covost2/README.md b/datasets/covost2/README.md index 6b077d2f73f..bea6e9fe514 100644 --- a/datasets/covost2/README.md +++ b/datasets/covost2/README.md @@ -4,7 +4,7 @@ annotations_creators: language_creators: - crowdsourced - expert-generated -languages: +language: - fr - de - es @@ -26,7 +26,7 @@ languages: - ja - id - cy -licenses: +license: - cc-by-nc-4.0 multilinguality: - multilingual diff --git a/datasets/cppe-5/README.md b/datasets/cppe-5/README.md index 4980f02493f..e713f9be702 100644 --- a/datasets/cppe-5/README.md +++ b/datasets/cppe-5/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/craigslist_bargains/README.md b/datasets/craigslist_bargains/README.md index c28852d6f07..082d3305f42 100644 --- a/datasets/craigslist_bargains/README.md +++ b/datasets/craigslist_bargains/README.md @@ -3,9 +3,9 @@ annotations_creators: - machine-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/crawl_domain/README.md b/datasets/crawl_domain/README.md index ee19b87835f..ffcf4a2ee8c 100644 --- a/datasets/crawl_domain/README.md +++ b/datasets/crawl_domain/README.md @@ -5,9 +5,9 @@ language_creators: - crowdsourced - expert-generated - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/crd3/README.md b/datasets/crd3/README.md index 8888e2334ab..544d756ccca 100644 --- a/datasets/crd3/README.md +++ b/datasets/crd3/README.md @@ -4,9 +4,9 @@ 
annotations_creators: - no-annotation language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/crime_and_punish/README.md b/datasets/crime_and_punish/README.md index 5a679dd184f..6fb932d8bf9 100644 --- a/datasets/crime_and_punish/README.md +++ b/datasets/crime_and_punish/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: null pretty_name: CrimeAndPunish diff --git a/datasets/crows_pairs/README.md b/datasets/crows_pairs/README.md index 114e1cbb951..6ec613d9e97 100644 --- a/datasets/crows_pairs/README.md +++ b/datasets/crows_pairs/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/cryptonite/README.md b/datasets/cryptonite/README.md index 80d2113d83d..200b15a29b5 100644 --- a/datasets/cryptonite/README.md +++ b/datasets/cryptonite/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - cc-by-nc-4.0 multilinguality: - monolingual diff --git a/datasets/cs_restaurants/README.md b/datasets/cs_restaurants/README.md index 1a8127d319b..0b4069339c6 100644 --- a/datasets/cs_restaurants/README.md +++ b/datasets/cs_restaurants/README.md @@ -4,9 +4,9 @@ annotations_creators: language_creators: - expert-generated - machine-generated -languages: +language: - cs -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/cuad/README.md b/datasets/cuad/README.md index 5ceb892020b..c1a90a24a95 100644 --- a/datasets/cuad/README.md +++ b/datasets/cuad/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/curiosity_dialogs/README.md 
b/datasets/curiosity_dialogs/README.md index 96f8e1c841d..7ddd497c842 100644 --- a/datasets/curiosity_dialogs/README.md +++ b/datasets/curiosity_dialogs/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-nc-4.0 multilinguality: - monolingual diff --git a/datasets/daily_dialog/README.md b/datasets/daily_dialog/README.md index 2e524b3b639..9ae96547994 100644 --- a/datasets/daily_dialog/README.md +++ b/datasets/daily_dialog/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/dane/README.md b/datasets/dane/README.md index 7bf71d17bc9..19cff36172e 100644 --- a/datasets/dane/README.md +++ b/datasets/dane/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - da -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/danish_political_comments/README.md b/datasets/danish_political_comments/README.md index db4612fdfd7..7a677764d68 100644 --- a/datasets/danish_political_comments/README.md +++ b/datasets/danish_political_comments/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - other -languages: +language: - da -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/dart/README.md b/datasets/dart/README.md index 61a27de7522..f4b1d171e8b 100644 --- a/datasets/dart/README.md +++ b/datasets/dart/README.md @@ -5,9 +5,9 @@ annotations_creators: language_creators: - crowdsourced - machine-generated -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/datacommons_factcheck/README.md b/datasets/datacommons_factcheck/README.md index a08a4c0fc38..99bbcca0652 100644 --- a/datasets/datacommons_factcheck/README.md 
+++ b/datasets/datacommons_factcheck/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-4.0 multilinguality: - monolingual diff --git a/datasets/dbpedia_14/README.md b/datasets/dbpedia_14/README.md index 33eb2293340..d6dc9a5ce2b 100644 --- a/datasets/dbpedia_14/README.md +++ b/datasets/dbpedia_14/README.md @@ -3,9 +3,9 @@ annotations_creators: - machine-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-3.0 multilinguality: - monolingual diff --git a/datasets/dbrd/README.md b/datasets/dbrd/README.md index 5f22ef35ee1..9021d655374 100644 --- a/datasets/dbrd/README.md +++ b/datasets/dbrd/README.md @@ -4,9 +4,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - nl -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/deal_or_no_dialog/README.md b/datasets/deal_or_no_dialog/README.md index 75fc6c73f28..88af05c2906 100644 --- a/datasets/deal_or_no_dialog/README.md +++ b/datasets/deal_or_no_dialog/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/definite_pronoun_resolution/README.md b/datasets/definite_pronoun_resolution/README.md index 233f85fc42e..de761b47874 100644 --- a/datasets/definite_pronoun_resolution/README.md +++ b/datasets/definite_pronoun_resolution/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: definite-pronoun-resolution-dataset pretty_name: Definite Pronoun Resolution Dataset diff --git a/datasets/dengue_filipino/README.md b/datasets/dengue_filipino/README.md index e0c34489479..3c2ec485755 100644 --- a/datasets/dengue_filipino/README.md +++ b/datasets/dengue_filipino/README.md @@ -4,9 +4,9 @@ annotations_creators: - machine-generated 
language_creators: - crowdsourced -languages: +language: - tl -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/dialog_re/README.md b/datasets/dialog_re/README.md index ba6ba087434..0915518d28d 100644 --- a/datasets/dialog_re/README.md +++ b/datasets/dialog_re/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - other-non-commercial-research-purpose-only multilinguality: - monolingual diff --git a/datasets/diplomacy_detection/README.md b/datasets/diplomacy_detection/README.md index 22f6259bbb0..7db6e4a0f61 100644 --- a/datasets/diplomacy_detection/README.md +++ b/datasets/diplomacy_detection/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/disaster_response_messages/README.md b/datasets/disaster_response_messages/README.md index c7abb4f1a0c..659f7ee4c51 100644 --- a/datasets/disaster_response_messages/README.md +++ b/datasets/disaster_response_messages/README.md @@ -3,13 +3,13 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - en - es - fr - ht - ur -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/discofuse/README.md b/datasets/discofuse/README.md index 570aff0f4dc..13dbd16ca91 100644 --- a/datasets/discofuse/README.md +++ b/datasets/discofuse/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: discofuse pretty_name: DiscoFuse diff --git a/datasets/discovery/README.md b/datasets/discovery/README.md index f7a876cb47b..e993542021a 100644 --- a/datasets/discovery/README.md +++ b/datasets/discovery/README.md @@ -3,9 +3,9 @@ annotations_creators: - other language_creators: - other -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git 
a/datasets/disfl_qa/README.md b/datasets/disfl_qa/README.md index 2f637094585..01c7a5b02cb 100644 --- a/datasets/disfl_qa/README.md +++ b/datasets/disfl_qa/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/doc2dial/README.md b/datasets/doc2dial/README.md index ffd5c2d4740..f4818d9970d 100644 --- a/datasets/doc2dial/README.md +++ b/datasets/doc2dial/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-3.0 multilinguality: - monolingual diff --git a/datasets/docred/README.md b/datasets/docred/README.md index ccfb4108a69..81f25a086b6 100644 --- a/datasets/docred/README.md +++ b/datasets/docred/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/doqa/README.md b/datasets/doqa/README.md index 7a1a3ce31e0..1d525c0dc60 100644 --- a/datasets/doqa/README.md +++ b/datasets/doqa/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: doqa pretty_name: DoQA diff --git a/datasets/dream/README.md b/datasets/dream/README.md index 79b7302351b..b5cc67098b5 100644 --- a/datasets/dream/README.md +++ b/datasets/dream/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/drop/README.md b/datasets/drop/README.md index e4ca98153ca..b06cb38b99e 100644 --- a/datasets/drop/README.md +++ b/datasets/drop/README.md @@ -4,9 +4,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git 
a/datasets/duorc/README.md b/datasets/duorc/README.md index 484d64be1f4..fc67b4d5c04 100644 --- a/datasets/duorc/README.md +++ b/datasets/duorc/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/dutch_social/README.md b/datasets/dutch_social/README.md index 2d8611d52bc..65051a67ec1 100644 --- a/datasets/dutch_social/README.md +++ b/datasets/dutch_social/README.md @@ -3,10 +3,10 @@ annotations_creators: - machine-generated language_creators: - crowdsourced -languages: +language: - en - nl -licenses: +license: - cc-by-nc-4.0 multilinguality: - multilingual diff --git a/datasets/dyk/README.md b/datasets/dyk/README.md index 0b6cccb70ea..92ac1041b3f 100644 --- a/datasets/dyk/README.md +++ b/datasets/dyk/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - other -languages: +language: - pl -licenses: +license: - bsd-3-clause multilinguality: - monolingual diff --git a/datasets/e2e_nlg/README.md b/datasets/e2e_nlg/README.md index 65a34c7670c..a168ab245e0 100644 --- a/datasets/e2e_nlg/README.md +++ b/datasets/e2e_nlg/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/e2e_nlg_cleaned/README.md b/datasets/e2e_nlg_cleaned/README.md index 3444856ba66..dd901a53a60 100644 --- a/datasets/e2e_nlg_cleaned/README.md +++ b/datasets/e2e_nlg_cleaned/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/ecb/README.md b/datasets/ecb/README.md index fba34e5cb78..988fd8cef5d 100644 --- a/datasets/ecb/README.md +++ b/datasets/ecb/README.md @@ -3,7 +3,7 @@ annotations_creators: - found 
language_creators: - found -languages: +language: - cs - da - de @@ -23,7 +23,7 @@ languages: - pt - sk - sl -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/ecthr_cases/README.md b/datasets/ecthr_cases/README.md index 2d6e618b964..bdb43343e39 100644 --- a/datasets/ecthr_cases/README.md +++ b/datasets/ecthr_cases/README.md @@ -4,9 +4,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/eduge/README.md b/datasets/eduge/README.md index 0b1bb97b080..e76b8b95592 100644 --- a/datasets/eduge/README.md +++ b/datasets/eduge/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - mn -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/ehealth_kd/README.md b/datasets/ehealth_kd/README.md index b4e667a311c..fb2579c5083 100644 --- a/datasets/ehealth_kd/README.md +++ b/datasets/ehealth_kd/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - es -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/eitb_parcc/README.md b/datasets/eitb_parcc/README.md index de59c43596e..742d723098f 100644 --- a/datasets/eitb_parcc/README.md +++ b/datasets/eitb_parcc/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - es - eu -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/electricity_load_diagrams/README.md b/datasets/electricity_load_diagrams/README.md index da14f32fb0d..9344cbdc4ae 100644 --- a/datasets/electricity_load_diagrams/README.md +++ b/datasets/electricity_load_diagrams/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - unknown -licenses: +license: - 
unknown multilinguality: - monolingual diff --git a/datasets/eli5/README.md b/datasets/eli5/README.md index 6a96e8b83b9..948848bb097 100644 --- a/datasets/eli5/README.md +++ b/datasets/eli5/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/eli5_category/README.md b/datasets/eli5_category/README.md index 950ec5050a1..ef946f0d880 100644 --- a/datasets/eli5_category/README.md +++ b/datasets/eli5_category/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/elkarhizketak/README.md b/datasets/elkarhizketak/README.md index efdd819af22..aca21069107 100644 --- a/datasets/elkarhizketak/README.md +++ b/datasets/elkarhizketak/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - crowdsourced -languages: +language: - eu -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/emea/README.md b/datasets/emea/README.md index fe440882159..0d80a95cc0c 100644 --- a/datasets/emea/README.md +++ b/datasets/emea/README.md @@ -3,7 +3,7 @@ annotations_creators: - found language_creators: - found -languages: +language: - bg - cs - da @@ -26,7 +26,7 @@ languages: - sk - sl - sv -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/emo/README.md b/datasets/emo/README.md index aabbfe2d3ed..b4658e36636 100644 --- a/datasets/emo/README.md +++ b/datasets/emo/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: emocontext pretty_name: EmoContext diff --git a/datasets/emotion/README.md b/datasets/emotion/README.md index 7268d7b87d5..b87fc4fd57c 100644 --- a/datasets/emotion/README.md +++ b/datasets/emotion/README.md @@ -4,9 +4,9 @@ annotations_creators: - machine-generated language_creators: 
- machine-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/emotone_ar/README.md b/datasets/emotone_ar/README.md index 8f2ea738517..ba0692d766e 100644 --- a/datasets/emotone_ar/README.md +++ b/datasets/emotone_ar/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - ar -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/empathetic_dialogues/README.md b/datasets/empathetic_dialogues/README.md index 46818d2a725..d21dc02dc2e 100644 --- a/datasets/empathetic_dialogues/README.md +++ b/datasets/empathetic_dialogues/README.md @@ -1,6 +1,6 @@ --- pretty_name: EmpatheticDialogues -languages: +language: - en paperswithcode_id: empatheticdialogues --- diff --git a/datasets/enriched_web_nlg/README.md b/datasets/enriched_web_nlg/README.md index e010d572e64..3a155037329 100644 --- a/datasets/enriched_web_nlg/README.md +++ b/datasets/enriched_web_nlg/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - crowdsourced -languages: +language: - de - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/enwik8/README.md b/datasets/enwik8/README.md index 259dca80dac..344b83cc207 100644 --- a/datasets/enwik8/README.md +++ b/datasets/enwik8/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/eraser_multi_rc/README.md b/datasets/eraser_multi_rc/README.md index 89022e1bd12..02ce62180d6 100644 --- a/datasets/eraser_multi_rc/README.md +++ b/datasets/eraser_multi_rc/README.md @@ -1,6 +1,6 @@ --- pretty_name: Eraser Multi Rc -languages: +language: - en paperswithcode_id: null --- diff --git a/datasets/esnli/README.md b/datasets/esnli/README.md index bbb210d8637..be02b53e4bc 100644 --- a/datasets/esnli/README.md +++ 
b/datasets/esnli/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: e-snli pretty_name: e-SNLI diff --git a/datasets/eth_py150_open/README.md b/datasets/eth_py150_open/README.md index 2107ff15464..ac1d4804fd1 100644 --- a/datasets/eth_py150_open/README.md +++ b/datasets/eth_py150_open/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotations language_creators: - machine-generated -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/ethos/README.md b/datasets/ethos/README.md index 130ad50abc2..e7fcb661c47 100644 --- a/datasets/ethos/README.md +++ b/datasets/ethos/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - found, other -languages: +language: - en -licenses: +license: - agpl-3.0-or-later multilinguality: - monolingual diff --git a/datasets/ett/README.md b/datasets/ett/README.md index 9cf7d593609..f9cb69c5741 100644 --- a/datasets/ett/README.md +++ b/datasets/ett/README.md @@ -3,9 +3,9 @@ annotations_creators: - no-annotation language_creators: - found -languages: +language: - unknown -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/eu_regulatory_ir/README.md b/datasets/eu_regulatory_ir/README.md index 93045c90e07..1c9f6eca485 100644 --- a/datasets/eu_regulatory_ir/README.md +++ b/datasets/eu_regulatory_ir/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/eurlex/README.md b/datasets/eurlex/README.md index 2044149d38d..1902c888c10 100644 --- a/datasets/eurlex/README.md +++ b/datasets/eurlex/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/euronews/README.md b/datasets/euronews/README.md index 
14a41780bb3..9eb222a5afe 100644 --- a/datasets/euronews/README.md +++ b/datasets/euronews/README.md @@ -3,11 +3,11 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - de - fr - nl -licenses: +license: - cc0-1.0 multilinguality: - multilingual diff --git a/datasets/europa_eac_tm/README.md b/datasets/europa_eac_tm/README.md index e16c6310e91..28d0507bb35 100644 --- a/datasets/europa_eac_tm/README.md +++ b/datasets/europa_eac_tm/README.md @@ -3,7 +3,7 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - bg - cs - da @@ -30,7 +30,7 @@ languages: - sl - sv - tr -licenses: +license: - cc-by-4.0 multilinguality: - translation diff --git a/datasets/europa_ecdc_tm/README.md b/datasets/europa_ecdc_tm/README.md index a3360174b22..fff0f4d432e 100644 --- a/datasets/europa_ecdc_tm/README.md +++ b/datasets/europa_ecdc_tm/README.md @@ -3,7 +3,7 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - bg - cs - da @@ -29,7 +29,7 @@ languages: - sk - sl - sv -licenses: +license: - cc-by-sa-4.0 multilinguality: - translation diff --git a/datasets/europarl_bilingual/README.md b/datasets/europarl_bilingual/README.md index 158db71fe3a..8935d04240c 100644 --- a/datasets/europarl_bilingual/README.md +++ b/datasets/europarl_bilingual/README.md @@ -3,7 +3,7 @@ annotations_creators: - found language_creators: - found -languages: +language: - bg - cs - da @@ -25,7 +25,7 @@ languages: - sk - sl - sv -licenses: +license: - unknown multilinguality: - translation diff --git a/datasets/event2Mind/README.md b/datasets/event2Mind/README.md index a51ba120940..03d9d5c141b 100644 --- a/datasets/event2Mind/README.md +++ b/datasets/event2Mind/README.md @@ -1,5 +1,5 @@ --- -languages: +language: - en paperswithcode_id: event2mind pretty_name: Event2Mind diff --git a/datasets/evidence_infer_treatment/README.md 
b/datasets/evidence_infer_treatment/README.md index b9b7d3eea4f..3a709c87772 100644 --- a/datasets/evidence_infer_treatment/README.md +++ b/datasets/evidence_infer_treatment/README.md @@ -4,9 +4,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/exams/README.md b/datasets/exams/README.md index 919a86684f4..35ab42bf91e 100644 --- a/datasets/exams/README.md +++ b/datasets/exams/README.md @@ -4,7 +4,7 @@ annotations_creators: - found language_creators: - found -languages: +language: - ar - bg - de @@ -21,7 +21,7 @@ languages: - sr - tr - vi -licenses: +license: - cc-by-sa-4.0 multilinguality: - monolingual diff --git a/datasets/factckbr/README.md b/datasets/factckbr/README.md index 07bbf9cfd6d..413370ce0d3 100644 --- a/datasets/factckbr/README.md +++ b/datasets/factckbr/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - pt -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/fake_news_english/README.md b/datasets/fake_news_english/README.md index 7138cf4275e..6faa20359c0 100644 --- a/datasets/fake_news_english/README.md +++ b/datasets/fake_news_english/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - expert-generated -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/fake_news_filipino/README.md b/datasets/fake_news_filipino/README.md index 7aeb3d5026e..aac72f80466 100644 --- a/datasets/fake_news_filipino/README.md +++ b/datasets/fake_news_filipino/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - crowdsourced -languages: +language: - tl -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/farsi_news/README.md b/datasets/farsi_news/README.md index 
c8f7696230d..6563fa86c77 100644 --- a/datasets/farsi_news/README.md +++ b/datasets/farsi_news/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - fa -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/fashion_mnist/README.md b/datasets/fashion_mnist/README.md index 266e08d1369..2746b81f256 100644 --- a/datasets/fashion_mnist/README.md +++ b/datasets/fashion_mnist/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/fever/README.md b/datasets/fever/README.md index 6e6a4b7bbc0..6ac951162c2 100644 --- a/datasets/fever/README.md +++ b/datasets/fever/README.md @@ -1,12 +1,12 @@ --- -languages: +language: - en paperswithcode_id: fever annotations_creators: - crowdsourced language_creators: - found -licenses: +license: - cc-by-sa-3.0 - gpl-3.0 multilinguality: diff --git a/datasets/few_rel/README.md b/datasets/few_rel/README.md index 2a4c2dd4b9f..97d0a23e4ce 100644 --- a/datasets/few_rel/README.md +++ b/datasets/few_rel/README.md @@ -4,9 +4,9 @@ annotations_creators: - machine-generated language_creators: - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/financial_phrasebank/README.md b/datasets/financial_phrasebank/README.md index 65690bbd95a..b9f240e9836 100644 --- a/datasets/financial_phrasebank/README.md +++ b/datasets/financial_phrasebank/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-nc-sa-3.0 multilinguality: - monolingual diff --git a/datasets/finer/README.md b/datasets/finer/README.md index 2b8f56e785e..e8d9846cd53 100644 --- a/datasets/finer/README.md +++ b/datasets/finer/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - 
other -languages: +language: - fi -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/flores/README.md b/datasets/flores/README.md index 72002380557..20634cb1bec 100644 --- a/datasets/flores/README.md +++ b/datasets/flores/README.md @@ -4,11 +4,11 @@ annotations_creators: - found language_creators: - found -languages: +language: - en - ne - si -licenses: +license: - cc-by-4.0 multilinguality: - translation diff --git a/datasets/flue/README.md b/datasets/flue/README.md index f936792a777..373ae398e2a 100644 --- a/datasets/flue/README.md +++ b/datasets/flue/README.md @@ -5,9 +5,9 @@ annotations_creators: - machine-generated language_creators: - crowdsourced -languages: +language: - fr -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/food101/README.md b/datasets/food101/README.md index fa0f9ff0741..392506e2dc8 100644 --- a/datasets/food101/README.md +++ b/datasets/food101/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/fquad/README.md b/datasets/fquad/README.md index 7664efb4710..0898d142f09 100644 --- a/datasets/fquad/README.md +++ b/datasets/fquad/README.md @@ -4,9 +4,9 @@ annotations_creators: language_creators: - crowdsourced - found -languages: +language: - fr -licenses: +license: - cc-by-nc-sa-3.0 multilinguality: - monolingual diff --git a/datasets/freebase_qa/README.md b/datasets/freebase_qa/README.md index 0315f1333f8..09f60c16049 100644 --- a/datasets/freebase_qa/README.md +++ b/datasets/freebase_qa/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - unknown multilinguality: - monolingual diff --git a/datasets/gap/README.md b/datasets/gap/README.md index 5ce0a3c2956..a71b4080016 100644 --- a/datasets/gap/README.md +++ b/datasets/gap/README.md @@ -1,5 
+1,5 @@ --- -languages: +language: - en paperswithcode_id: gap pretty_name: GAP Benchmark Suite diff --git a/datasets/gem/README.md b/datasets/gem/README.md index 3dbe3c1e50c..5750d3c19c9 100644 --- a/datasets/gem/README.md +++ b/datasets/gem/README.md @@ -6,7 +6,7 @@ language_creators: - crowdsourced - found - machine-generated -languages: +language: - cs - de - en @@ -14,7 +14,7 @@ languages: - ru - tr - vi -licenses: +license: - other-research-only multilinguality: - monolingual diff --git a/datasets/generated_reviews_enth/README.md b/datasets/generated_reviews_enth/README.md index 0d05f6d7098..8cce93031bd 100644 --- a/datasets/generated_reviews_enth/README.md +++ b/datasets/generated_reviews_enth/README.md @@ -4,10 +4,10 @@ annotations_creators: - machine-generated language_creators: - machine-generated -languages: +language: - en - th -licenses: +license: - cc-by-sa-4.0 multilinguality: - translation diff --git a/datasets/generics_kb/README.md b/datasets/generics_kb/README.md index e465824ae03..a4bdc07e1a5 100644 --- a/datasets/generics_kb/README.md +++ b/datasets/generics_kb/README.md @@ -3,9 +3,9 @@ annotations_creators: - machine-generated language_creators: - found -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/german_legal_entity_recognition/README.md b/datasets/german_legal_entity_recognition/README.md index e57fe49f8b8..42efc6b8864 100644 --- a/datasets/german_legal_entity_recognition/README.md +++ b/datasets/german_legal_entity_recognition/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - found -languages: +language: - de -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/germaner/README.md b/datasets/germaner/README.md index bb1f47b8864..b7b4e2bcb12 100644 --- a/datasets/germaner/README.md +++ b/datasets/germaner/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: 
+language: - de -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/giga_fren/README.md b/datasets/giga_fren/README.md index b77de7bf102..3bcfe951012 100644 --- a/datasets/giga_fren/README.md +++ b/datasets/giga_fren/README.md @@ -3,10 +3,10 @@ annotations_creators: - found language_creators: - found -languages: +language: - en - fr -licenses: +license: - unknown multilinguality: - multilingual diff --git a/datasets/gigaword/README.md b/datasets/gigaword/README.md index 038f076b710..f79c05224ad 100644 --- a/datasets/gigaword/README.md +++ b/datasets/gigaword/README.md @@ -3,9 +3,9 @@ annotations_creators: - found language_creators: - found -languages: +language: - en -licenses: +license: - mit multilinguality: - monolingual diff --git a/datasets/glucose/README.md b/datasets/glucose/README.md index 000fed1adcc..11d03c3afd8 100644 --- a/datasets/glucose/README.md +++ b/datasets/glucose/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - crowdsourced -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/glue/README.md b/datasets/glue/README.md index d02f67f7756..0bfe66f279d 100644 --- a/datasets/glue/README.md +++ b/datasets/glue/README.md @@ -3,9 +3,9 @@ annotations_creators: - unknown language_creators: - unknown -languages: +language: - en -licenses: +license: - cc-by-4.0 multilinguality: - monolingual diff --git a/datasets/gnad10/README.md b/datasets/gnad10/README.md index 75bf6227e95..092dbd493ac 100644 --- a/datasets/gnad10/README.md +++ b/datasets/gnad10/README.md @@ -3,9 +3,9 @@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - de -licenses: +license: - cc-by-nc-sa-4.0 multilinguality: - monolingual diff --git a/datasets/go_emotions/README.md b/datasets/go_emotions/README.md index 80d022e6a2f..ffc46e22b10 100644 --- a/datasets/go_emotions/README.md +++ b/datasets/go_emotions/README.md @@ -3,9 +3,9 
@@ annotations_creators: - crowdsourced language_creators: - found -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/gooaq/README.md b/datasets/gooaq/README.md index 54d80c25333..cd30bdb91ee 100644 --- a/datasets/gooaq/README.md +++ b/datasets/gooaq/README.md @@ -3,9 +3,9 @@ annotations_creators: - expert-generated language_creators: - machine-generated -languages: +language: - en -licenses: +license: - apache-2.0 multilinguality: - monolingual diff --git a/datasets/google_wellformed_query/README.md b/datasets/google_wellformed_query/README.md index 099251b739a..bd83f8cfdee 100644 --- a/datasets/google_wellformed_query/README.md +++ b/datasets/google_wellformed_query/README.md @@ -5,7 +5,7 @@ multilinguality: - monolingual task_ids: - text-scoring -languages: +language: - en annotations_creators: - crowdsourced @@ -13,7 +13,7 @@ source_datasets: - extended size_categories: - 10K 0: raise TypeError( "Could not validate the metadata, found the following errors:\n" @@ -363,7 +373,7 @@ def validate_language_codes(languages: Union[List[str], Dict[str, List[str]]]) - return tagset_validator( languages, known_language_codes.keys(), - "languages", + "language", known_language_codes_url, lambda lang: lang == "unknown", ) @@ -373,7 +383,7 @@ def validate_licences(licenses: Union[List[str], Dict[str, List[str]]]) -> Valid validated, error = tagset_validator( licenses, list(known_licenses.keys()), - "licenses", + "license", known_licenses_url, lambda e: "-other-" in e or e.startswith("other-"), ) diff --git a/tests/test_metadata_util.py b/tests/test_metadata_util.py index cbe2e35d545..9642c7f3767 100644 --- a/tests/test_metadata_util.py +++ b/tests/test_metadata_util.py @@ -20,7 +20,7 @@ def _dedent(string: str) -> str: README_YAML = """\ --- -languages: +language: - zh - en task_ids: @@ -142,7 +142,7 @@ def test_yaml_block_from_readme(self): yaml_block, _dedent( """\ - languages: + language: - zh - en task_ids: 
@@ -173,7 +173,7 @@ def test_metadata_dict_from_readme(self): with open(path, "w+") as readme_file: readme_file.write(README_YAML) metadata_dict = metadata_dict_from_readme(path) - self.assertDictEqual(metadata_dict, {"languages": ["zh", "en"], "task_ids": ["sentiment-classification"]}) + self.assertDictEqual(metadata_dict, {"language": ["zh", "en"], "task_ids": ["sentiment-classification"]}) with open(path, "w+") as readme_file: readme_file.write(README_EMPTY_YAML) @@ -188,7 +188,15 @@ def test_metadata_dict_from_readme(self): def test_from_yaml_string(self): default_optional_keys = { - field.name: field.default for field in fields(DatasetMetadata) if type(field.default) is _MISSING_TYPE + field.name: field.default + for field in fields(DatasetMetadata) + if type(field.default) is _MISSING_TYPE and field.name not in DatasetMetadata._DEPRECATED_YAML_KEYS + } + + default_deprecated_keys = { + field.name: field.default + for field in fields(DatasetMetadata) + if field.name in DatasetMetadata._DEPRECATED_YAML_KEYS } valid_yaml_string = _dedent( @@ -197,9 +205,9 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -222,12 +230,12 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: en: - en fr: - fr - licenses: + license: - unknown multilinguality: - monolingual @@ -250,9 +258,9 @@ def test_from_yaml_string(self): - found language_creators: - some guys in Panama - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -275,9 +283,9 @@ def test_from_yaml_string(self): """\ annotations_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -300,9 +308,9 @@ def test_from_yaml_string(self): """\ annotations_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ 
-329,12 +337,12 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: en: - en en: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -359,9 +367,9 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -385,9 +393,9 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -411,9 +419,9 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -440,9 +448,9 @@ def test_from_yaml_string(self): - found language_creators: - found - languages: + language: - en - licenses: + license: - unknown multilinguality: - monolingual @@ -487,10 +495,11 @@ def test_from_yaml_string(self): metadata_dict = asdict(metadata) expected = { **default_optional_keys, + **default_deprecated_keys, "annotations_creators": ["found"], "language_creators": ["found"], - "languages": ["en"], - "licenses": ["unknown"], + "language": ["en"], + "license": ["unknown"], "multilinguality": ["monolingual"], "pretty_name": "Test Dataset", "size_categories": ["10K