From 36b8f39157d9ddb8dc2f3467e7ac10355d18476d Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 30 Mar 2022 16:16:02 +0200
Subject: [PATCH 01/10] update tasks list

---
 src/datasets/utils/resources/tasks.json | 259 +++++++++++++++---------
 1 file changed, 158 insertions(+), 101 deletions(-)

diff --git a/src/datasets/utils/resources/tasks.json b/src/datasets/utils/resources/tasks.json
index 0585f97b917..540e6ffbccd 100644
--- a/src/datasets/utils/resources/tasks.json
+++ b/src/datasets/utils/resources/tasks.json
@@ -1,54 +1,110 @@
 {
-    "conditional-text-generation": {
-        "description": "data-to-text and text transduction tasks such as translation or summarization",
-        "options": [
-            "machine-translation",
-            "sentence-splitting-fusion",
-            "summarization",
-            "table-to-text",
-            "text-simplification",
-            "explanation-generation",
-            "other-structured-to-text",
-            "other"
+    "audio-classification": {
+        "type": "audio",
+        "subtasks": [
+            "keyword-spotting",
+            "speaker-identification",
+            "speaker-intent-classification",
+            "emotion-recognition",
+            "speaker-language-identification"
+        ]
+    },
+    "audio-to-audio": {
+        "type": "audio"
+    },
+    "automatic-speech-recognition": {
+        "type": "multimodal"
+    },
+    "conversational": {
+        "type": "text",
+        "subtasks": [
+            "dialogue-generation"
+        ]
+    },
+    "feature-extraction": {
+        "type": "multimodal"
+    },
+    "fill-mask": {
+        "type": "text",
+        "subtasks": [
+            "slot-filling",
+            "masked-language-modeling"
+        ]
+    },
+    "image-classification": {
+        "type": "image",
+        "subtasks": [
+            "multi-label-image-classification",
+            "multi-class-image-classification"
+        ]
+    },
+    "image-segmentation": {
+        "type": "image",
+        "subtasks": [
+            "instance-segmentation",
+            "semantic-segmentation",
+            "panoptic-segmentation"
+        ]
+    },
+    "image-to-text": {
+        "type": "multimodal",
+        "subtasks": [
+            "image-captioning"
+        ]
+    },
+    "multiple-choice": {
+        "type": "text",
+        "subtasks": [
+            "multiple-choice-question-answering",
+            "multiple-choice-coreference-resolution"
+        ]
+    },
+    "object-detection": {
+        "type": "image",
+        "subtasks": [
+            "face-detection",
+            "vehicle-detection"
         ]
     },
     "question-answering": {
-        "description": "question answering tasks",
-        "options": [
-            "open-domain-qa",
-            "closed-domain-qa",
-            "multiple-choice-qa",
+        "type": "text",
+        "aliases": [
+            "extractive-question-answering"
+        ],
+        "subtasks": [
             "extractive-qa",
-            "abstractive-qa",
-            "other"
+            "open-domain-qa",
+            "closed-domain-qa"
         ]
     },
-    "sequence-modeling": {
-        "description": "such as language modeling or dialogue",
-        "options": [
-            "dialogue-modeling",
-            "language-modeling",
-            "other-multi-turn",
-            "slot-filling",
-            "other"
+    "sentence-similarity": {
+        "type": "text"
+    },
+    "tabular-classification": {
+        "type": "text"
+    },
+    "tabular-to-text": {
+        "type": "text",
+        "subtasks": [
+            "rdf-to-text"
         ]
     },
-    "structure-prediction": {
-        "description": "predicting structural properties of the text, such as syntax",
-        "options": [
-            "coreference-resolution",
-            "named-entity-recognition",
-            "part-of-speech-tagging",
-            "parsing",
-            "semantic-role-labeling",
-            "lemmatization",
-            "word-sense-disambiguation",
-            "other"
+    "summarization": {
+        "type": "text",
+        "subtasks": [
+            "news-articles-summarization",
+            "news-articles-headline-generation"
         ]
     },
+    "table-to-text": {
+        "type": "text"
+    },
+    "table-question-answering": {
+        "type": "text"
+    },
     "text-classification": {
-        "description": "predicting a class index or boolean value",
-        "options": [
+        "type": "text",
+        "subtasks": [
             "acceptability-classification",
             "entity-linking-classification",
             "fact-checking",
@@ -59,90 +115,91 @@
             "semantic-similarity-classification",
             "sentiment-classification",
             "topic-classification",
-            "other"
+            "semantic-similarity-scoring",
+            "sentiment-scoring",
+            "sentiment-analysis",
+            "hate-speech-detection",
+            "text-scoring"
+        ]
+    },
+    "text-generation": {
+        "type": "text",
+        "subtasks": [
+            "dialogue-modeling",
+            "language-modeling"
         ]
     },
     "text-retrieval": {
-        "description": "information or text retrieval tasks",
-        "options": [
+        "type": "text",
+        "subtasks": [
             "document-retrieval",
             "utterance-retrieval",
             "entity-linking-retrieval",
-            "fact-checking-retrieval",
-            "other"
+            "fact-checking-retrieval"
         ]
     },
-    "text-scoring": {
-        "description": "text scoring tasks, predicting a real valued score for some text",
-        "options": [
-            "semantic-similarity-scoring",
-            "sentiment-scoring",
-            "other"
+    "text-to-image": {
+        "type": "multimodal"
+    },
+    "text-to-tabular": {
+        "type": "text",
+        "subtasks": [
+            "relation-extraction",
+            "semantic-role-labeling"
         ]
     },
-    "speech-processing": {
-        "description": "tasks related to the analysis and representations of speech signals",
-        "options": [
-            "automatic-speech-recognition",
-            "phoneme-recognition",
-            "keyword-spotting",
-            "query-by-example-spoken-term-detection",
-            "speaker-identification",
-            "automatic-speaker-verification",
-            "speaker-diarization",
-            "intent-classification",
-            "slot-filling",
-            "emotion-recognition"
+    "text-to-speech": {
+        "type": "multimodal"
+    },
+    "text2text-generation": {
+        "type": "text",
+        "subtasks": [
+            "text-simplification",
+            "explanation-generation",
+            "abstractive-qa",
+            "open-domain-abstractive-qa",
+            "closed-domain-qa",
+            "open-book-qa",
+            "closed-book-qa"
         ]
     },
     "time-series-forecasting": {
-        "description": "tasks related to predicting future values of a time series",
-        "options": [
+        "type": "time series",
+        "subtasks": [
             "univariate-time-series-forecasting",
             "multivariate-time-series-forecasting"
         ]
     },
-    "object-detection": {
-        "description": "tasks related to detecting instances of objects from a particular class in an image",
-        "options": [
-            "face-detection",
-            "other"
+    "token-classification": {
+        "type": "text",
+        "aliases": [
+            "structure-prediction"
+        ],
+        "subtasks": [
+            "named-entity-recognition",
+            "part-of-speech-tagging",
+            "parsing",
+            "lemmatization",
+            "word-sense-disambiguation",
+            "coreference-resolution"
         ]
     },
-    "image-to-text": {
-        "description": "tasks related to generating text from images",
-        "options": [
-            "image-captioning",
-            "other"
-        ]
+    "translation": {
+        "type": "text"
     },
-    "text-to-image": {
-        "description": "tasks related to generating images from text",
-        "options": []
+    "visual-question-answering": {
+        "type": "multimodal"
     },
-    "image-segmentation": {
-        "description": "tasks related to detecting and delineating distinct objects in images",
-        "options": [
-            "instance-segmentation",
-            "semantic-segmentation",
-            "panoptic-segmentation",
-            "other"
-        ]
+    "voice-activity-detection": {
+        "type": "audio"
     },
-    "image-classification": {
-        "description": "tasks related to identifying what images represent",
-        "options": [
-            "multi-label-image-classification",
-            "single-label-image-classification",
-            "other"
-        ]
-
+    "zero-shot-classification": {
+        "type": "text"
     },
-
-    "other": {
-        "description": "other task family not mentioned here",
-        "options": [
-            "other"
-        ]
+    "zero-shot-image-classification": {
+        "type": "multimodal"
+    },
+    "reinforcement-learning": {
+        "type": "other"
     }
 }
\ No newline at end of file

From 1ccbe6b38dd8af67f0b04d9cbcf0b66aac8f20e5 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 30 Mar 2022 16:16:17 +0200
Subject: [PATCH 02/10] update tags in dataset cards

---
 datasets/acronym_identification/README.md     |  4 +-
 datasets/ade_corpus_v2/README.md              |  4 +-
 datasets/afrikaans_ner_corpus/README.md       |  2 +-
 datasets/air_dialogue/README.md               |  8 ++--
 datasets/allegro_reviews/README.md            |  3 +-
 datasets/alt/README.md                        |  5 +--
 datasets/amazon_reviews_multi/README.md       |  9 ++--
 datasets/ami/README.md                        |  3 +-
 datasets/amttl/README.md                      |  2 +-
 datasets/app_reviews/README.md                |  3 +-
 datasets/aquamuse/README.md                   |  1 +
 datasets/arabic_billion_words/README.md       |  4 +-
 datasets/arabic_pos_dialect/README.md         |  2 +-
 datasets/arabic_speech_corpus/README.md       |  3 +-
 datasets/arxiv_dataset/README.md              |  5 +--
 datasets/asset/README.md                      |  8 ++--
 datasets/assin/README.md                      |  2 +-
 datasets/assin2/README.md                     |  2 +-
 datasets/atomic/README.md                     |  4 +-
 datasets/autshumato/README.md                 |  5 +--
 datasets/bbaw_egyptian/README.md              |  5 +--
 datasets/bc2gm_corpus/README.md               |  2 +-
 datasets/best2009/README.md                   |  4 +-
 datasets/bianet/README.md                     |  5 +--
 datasets/bible_para/README.md                 |  5 +--
 datasets/big_patent/README.md                 |  4 +-
 datasets/billsum/README.md                    |  4 +-
 datasets/biosses/README.md                    |  3 +-
 datasets/blbooks/README.md                    |  4 +-
 datasets/blbooksgenre/README.md               |  4 +-
 datasets/bnl_newspapers/README.md             |  4 +-
 datasets/bookcorpus/README.md                 |  4 +-
 datasets/bookcorpusopen/README.md             |  4 +-
 datasets/brwac/README.md                      |  4 +-
 datasets/bsd_ja_en/README.md                  |  4 +-
 datasets/bswac/README.md                      |  4 +-
 datasets/c4/README.md                         |  4 +-
 datasets/caner/README.md                      |  2 +-
 datasets/capes/README.md                      |  5 ++-
 datasets/casino/README.md                     |  6 +--
 datasets/cawac/README.md                      |  4 +-
 datasets/cc100/README.md                      |  4 +-
 datasets/cc_news/README.md                    |  4 +-
 datasets/chr_en/README.md                     | 19 ++++----
 datasets/climate_fever/README.md              |  2 +-
 datasets/cmu_hinglish_dog/README.md           |  5 +--
 datasets/cnn_dailymail/README.md              |  4 +-
 datasets/coached_conv_pref/README.md          |  5 ++-
 datasets/code_search_net/README.md            |  4 +-
 .../README.md                                 |  3 +-
 .../README.md                                 |  3 +-
 .../README.md                                 |  3 +-
 .../README.md                                 |  4 +-
 .../code_x_glue_cc_code_refinement/README.md  |  6 +--
 .../README.md                                 |  4 +-
 .../code_x_glue_ct_code_to_text/README.md     |  4 +-
 .../code_x_glue_tc_text_to_code/README.md     |  4 +-
 .../code_x_glue_tt_text_to_text/README.md     |  4 +-
 datasets/common_gen/README.md                 |  4 ++
 datasets/common_language/README.md            |  4 +-
 datasets/common_voice/README.md               |  3 +-
 datasets/competition_math/README.md           |  4 +-
 datasets/conll2002/README.md                  |  2 +-
 datasets/conll2003/README.md                  |  2 +-
 datasets/conll2012_ontonotesv5/README.md      |  2 +-
 datasets/conllpp/README.md                    |  2 +-
 datasets/conv_ai/README.md                    |  7 +--
 datasets/conv_ai_2/README.md                  |  5 ++-
 datasets/conv_ai_3/README.md                  |  5 ++-
 datasets/conv_questions/README.md             |  3 +-
 datasets/counter/README.md                    |  2 +-
 datasets/covost2/README.md                    |  3 +-
 datasets/craigslist_bargains/README.md        |  3 +-
 datasets/crd3/README.md                       |  6 +--
 datasets/crows_pairs/README.md                |  5 ++-
 datasets/cs_restaurants/README.md             | 10 +++--
 datasets/curiosity_dialogs/README.md          |  8 ++--
 datasets/dane/README.md                       |  2 +-
 datasets/dart/README.md                       |  6 +--
 datasets/dbrd/README.md                       |  6 ++-
 datasets/deal_or_no_dialog/README.md          |  5 +--
 datasets/dialog_re/README.md                  |  3 +-
 datasets/disaster_response_messages/README.md |  2 +-
 datasets/drop/README.md                       |  1 +
 datasets/duorc/README.md                      |  1 +
 datasets/e2e_nlg/README.md                    |  6 +--
 datasets/e2e_nlg_cleaned/README.md            |  6 +--
 datasets/ecb/README.md                        |  5 +--
 datasets/ehealth_kd/README.md                 |  4 +-
 datasets/eitb_parcc/README.md                 |  5 +--
 datasets/eli5/README.md                       |  6 +--
 datasets/eli5_category/README.md              |  6 +--
 datasets/elkarhizketak/README.md              |  2 +-
 datasets/emea/README.md                       |  5 +--
 datasets/enriched_web_nlg/README.md           |  6 +--
 datasets/euronews/README.md                   |  2 +-
 datasets/europa_eac_tm/README.md              |  7 ++-
 datasets/europa_ecdc_tm/README.md             |  7 ++-
 datasets/europarl_bilingual/README.md         |  5 +--
 datasets/farsi_news/README.md                 |  4 +-
 datasets/finer/README.md                      |  2 +-
 datasets/flores/README.md                     |  5 +--
 datasets/gem/README.md                        | 45 ++++++++++---------
 datasets/generated_reviews_enth/README.md     |  3 +-
 .../german_legal_entity_recognition/README.md |  2 +-
 datasets/germaner/README.md                   |  2 +-
 datasets/giga_fren/README.md                  |  5 +--
 datasets/gigaword/README.md                   |  4 +-
 datasets/glucose/README.md                    |  8 ++--
 datasets/glue/README.md                       |  3 +-
 datasets/google_wellformed_query/README.md    |  4 +-
 datasets/great_code/README.md                 |  3 +-
 datasets/harem/README.md                      |  2 +-
 datasets/has_part/README.md                   |  5 ++-
 datasets/hate_speech_pl/README.md             |  2 +-
 datasets/hausa_voa_ner/README.md              |  2 +-
 datasets/hebrew_projectbenyehuda/README.md    |  4 +-
 datasets/hebrew_this_world/README.md          |  4 +-
 datasets/hind_encorp/README.md                |  5 +--
 datasets/hindi_discourse/README.md            |  8 ++--
 datasets/hippocorpus/README.md                |  5 ++-
 datasets/hkcancor/README.md                   |  6 +--
 datasets/hrenwac_para/README.md               |  5 +--
 datasets/hrwac/README.md                      |  4 +-
 datasets/humicroedit/README.md                |  5 ++-
 datasets/id_liputan6/README.md                |  3 +-
 datasets/id_nergrit_corpus/README.md          |  2 +-
 datasets/id_newspapers_2018/README.md         |  4 +-
 datasets/id_panl_bppt/README.md               |  5 +--
 datasets/id_puisi/README.md                   |  8 ++--
 .../README.md                                 |  5 +--
 datasets/igbo_monolingual/README.md           |  4 +-
 datasets/igbo_ner/README.md                   |  2 +-
 datasets/indonlu/README.md                    | 16 +++----
 datasets/inquisitive_qg/README.md             |  4 +-
 datasets/irc_disentangle/README.md            |  4 +-
 datasets/isixhosa_ner_corpus/README.md        |  2 +-
 datasets/isizulu_ner_corpus/README.md         |  2 +-
 datasets/jfleg/README.md                      |  4 +-
 datasets/jigsaw_unintended_bias/README.md     |  5 ++-
 datasets/jnlpba/README.md                     |  2 +-
 datasets/kd_conv/README.md                    |  4 +-
 datasets/kde4/README.md                       |  5 +--
 datasets/kilt_tasks/README.md                 | 13 +++---
 datasets/klue/README.md                       | 14 +++---
 datasets/kor_ner/README.md                    |  2 +-
 datasets/lama/README.md                       |  5 ++-
 datasets/lambada/README.md                    |  4 +-
 datasets/lener_br/README.md                   |  2 +-
 datasets/librispeech_asr/README.md            |  3 +-
 datasets/limit/README.md                      |  2 +-
 datasets/linnaeus/README.md                   |  2 +-
 datasets/lj_speech/README.md                  |  3 +-
 datasets/lst20/README.md                      |  8 ++--
 datasets/m_lama/README.md                     |  5 ++-
 datasets/mac_morpho/README.md                 |  2 +-
 datasets/makhzan/README.md                    |  4 +-
 datasets/masakhaner/README.md                 |  2 +-
 datasets/mbpp/README.md                       |  4 +-
 datasets/mc4/README.md                        |  4 +-
 datasets/mdd/README.md                        |  3 +-
 datasets/menyo20k_mt/README.md                |  5 +--
 datasets/meta_woz/README.md                   |  3 +-
 datasets/miam/README.md                       |  8 +++-
 datasets/mkb/README.md                        |  4 +-
 datasets/mlsum/README.md                      |  3 +-
 datasets/ms_terms/README.md                   |  5 +--
 datasets/msr_text_compression/README.md       |  3 +-
 .../msr_zhen_translation_parity/README.md     |  5 +--
 datasets/msra_ner/README.md                   |  2 +-
 datasets/mt_eng_vietnamese/README.md          |  5 +--
 datasets/multi_news/README.md                 |  5 ++-
 datasets/multi_nli/README.md                  |  3 +-
 datasets/multi_nli_mismatch/README.md         |  3 +-
 datasets/multi_para_crawl/README.md           |  5 +--
 datasets/multi_woz_v22/README.md              |  5 ++-
 datasets/multi_x_science_sum/README.md        |  6 +--
 datasets/multilingual_librispeech/README.md   |  3 +-
 datasets/mutual_friends/README.md             |  3 +-
 datasets/narrativeqa/README.md                |  2 +-
 datasets/narrativeqa_manual/README.md         |  2 +-
 datasets/ncbi_disease/README.md               |  2 +-
 datasets/nchlt/README.md                      |  2 +-
 datasets/ncslgr/README.md                     |  5 +--
 datasets/nell/README.md                       |  5 ++-
 datasets/news_commentary/README.md            |  5 +--
 datasets/newsph/README.md                     |  4 +-
 datasets/newspop/README.md                    |  5 ++-
 datasets/newsroom/README.md                   |  4 +-
 datasets/nkjp-ner/README.md                   |  2 +-
 datasets/norec/README.md                      |  2 +-
 datasets/norne/README.md                      |  2 +-
 datasets/norwegian_ner/README.md              |  2 +-
 datasets/numer_sense/README.md                |  3 +-
 datasets/numeric_fused_head/README.md         |  4 +-
 datasets/oclar/README.md                      |  2 +-
 datasets/ofis_publik/README.md                |  5 +--
 datasets/ollie/README.md                      |  5 +--
 datasets/onestop_english/README.md            |  2 +-
 datasets/open_subtitles/README.md             |  5 +--
 datasets/openai_humaneval/README.md           |  4 +-
 datasets/openslr/README.md                    |  3 +-
 datasets/openwebtext/README.md                |  4 +-
 datasets/opus100/README.md                    |  4 +-
 datasets/opus_books/README.md                 |  5 +--
 datasets/opus_dgt/README.md                   |  5 +--
 datasets/opus_dogc/README.md                  |  5 +--
 datasets/opus_elhuyar/README.md               |  5 +--
 datasets/opus_euconst/README.md               |  5 +--
 datasets/opus_finlex/README.md                |  5 +--
 datasets/opus_fiskmo/README.md                |  5 +--
 datasets/opus_gnome/README.md                 |  5 +--
 datasets/opus_infopankki/README.md            |  5 +--
 datasets/opus_memat/README.md                 |  5 +--
 datasets/opus_montenegrinsubs/README.md       |  5 +--
 datasets/opus_openoffice/README.md            |  5 +--
 datasets/opus_paracrawl/README.md             |  5 +--
 datasets/opus_rf/README.md                    |  5 +--
 datasets/opus_tedtalks/README.md              |  5 +--
 datasets/opus_ubuntu/README.md                |  5 +--
 datasets/opus_wikipedia/README.md             |  5 +--
 datasets/opus_xhosanavy/README.md             |  5 +--
 datasets/orange_sum/README.md                 |  5 ++-
 datasets/oscar/README.md                      |  4 +-
 datasets/para_crawl/README.md                 |  5 +--
 datasets/para_pat/README.md                   |  4 +-
 datasets/paws-x/README.md                     |  4 +-
 datasets/paws/README.md                       |  4 +-
 datasets/pec/README.md                        |  3 +-
 datasets/peoples_daily_ner/README.md          |  2 +-
 datasets/persian_ner/README.md                |  2 +-
 datasets/php/README.md                        |  5 +--
 datasets/pib/README.md                        |  7 +--
 datasets/pn_summary/README.md                 |  5 ++-
 datasets/poleval2019_mt/README.md             |  5 +--
 datasets/polsum/README.md                     |  4 +-
 datasets/polyglot_ner/README.md               |  2 +-
 datasets/psc/README.md                        |  4 +-
 datasets/ptb_text_only/README.md              |  4 +-
 datasets/pubmed/README.md                     | 10 ++---
 datasets/py_ast/README.md                     |  8 ++--
 datasets/qed_amara/README.md                  |  5 +--
 datasets/quac/README.md                       |  3 +-
 datasets/recipe_nlg/README.md                 |  6 ++-
 datasets/reddit/README.md                     |  4 +-
 datasets/reddit_tifu/README.md                |  6 +--
 datasets/refresd/README.md                    |  2 +-
 datasets/ro_sts/README.md                     |  3 +-
 datasets/ro_sts_parallel/README.md            |  5 +--
 datasets/ronec/README.md                      |  2 +-
 datasets/s2orc/README.md                      |  4 +-
 datasets/samsum/README.md                     |  4 +-
 datasets/sanskrit_classic/README.md           |  4 +-
 datasets/saudinewsnet/README.md               |  4 +-
 datasets/scb_mt_enth_2020/README.md           |  5 +--
 datasets/schema_guided_dstc8/README.md        |  5 ++-
 datasets/scielo/README.md                     |  5 +--
 datasets/scitldr/README.md                    |  4 +-
 datasets/sede/README.md                       |  2 +-
 datasets/sem_eval_2014_task_1/README.md       |  2 +-
 datasets/sem_eval_2020_task_11/README.md      |  4 +-
 datasets/senti_ws/README.md                   |  7 +--
 datasets/sepedi_ner/README.md                 |  2 +-
 datasets/sesotho_ner_corpus/README.md         |  2 +-
 datasets/setimes/README.md                    |  5 +--
 datasets/setswana_ner_corpus/README.md        |  2 +-
 datasets/silicone/README.md                   | 24 +++++++++-
 datasets/siswati_ner_corpus/README.md         |  2 +-
 datasets/smartdata/README.md                  |  2 +-
 .../snow_simplified_japanese_corpus/README.md |  5 +--
 datasets/so_stacksample/README.md             |  4 +-
 datasets/social_bias_frames/README.md         |  4 +-
 datasets/sofc_materials_articles/README.md    |  5 ++-
 datasets/spanish_billion_words/README.md      |  4 +-
 datasets/spc/README.md                        |  5 +--
 datasets/species_800/README.md                |  2 +-
 datasets/speech_commands/README.md            |  4 +-
 datasets/spider/README.md                     |  4 +-
 datasets/srwac/README.md                      |  4 +-
 datasets/sst/README.md                        |  2 +-
 datasets/stsb_multi_mt/README.md              |  3 +-
 datasets/superb/README.md                     | 10 ++---
 datasets/swahili/README.md                    |  4 +-
 datasets/swedish_medical_ner/README.md        |  2 +-
 datasets/swedish_ner_corpus/README.md         |  2 +-
 datasets/tanzil/README.md                     |  5 +--
 datasets/tapaco/README.md                     |  6 +--
 datasets/tashkeela/README.md                  |  4 +-
 datasets/taskmaster1/README.md                |  3 +-
 datasets/taskmaster2/README.md                |  3 +-
 datasets/taskmaster3/README.md                |  3 +-
 datasets/tatoeba/README.md                    |  5 +--
 datasets/ted_iwlst2013/README.md              |  5 +--
 datasets/ted_talks_iwslt/README.md            |  5 +--
 datasets/telugu_books/README.md               |  4 +-
 datasets/telugu_news/README.md                |  4 +-
 datasets/tep_en_fa_para/README.md             |  5 +--
 datasets/text2log/README.md                   |  5 +--
 datasets/thainer/README.md                    |  2 +-
 datasets/thaisum/README.md                    |  7 +--
 datasets/the_pile/README.md                   |  4 +-
 datasets/the_pile_books3/README.md            |  4 +-
 datasets/the_pile_openwebtext2/README.md      |  4 +-
 datasets/the_pile_stack_exchange/README.md    |  4 +-
 datasets/tilde_model/README.md                |  5 +--
 .../times_of_india_news_headlines/README.md   |  4 +-
 datasets/timit_asr/README.md                  |  3 +-
 datasets/tlc/README.md                        |  4 +-
 datasets/tmu_gfm_dataset/README.md            |  4 +-
 datasets/totto/README.md                      |  3 +-
 datasets/trivia_qa/README.md                  |  2 +
 datasets/turk/README.md                       |  2 +-
 datasets/turkic_xwmt/README.md                |  5 +--
 datasets/turkish_ner/README.md                |  2 +-
 datasets/turkish_shrinked_ner/README.md       |  2 +-
 datasets/turku_ner_corpus/README.md           |  2 +-
 datasets/tweets_ar_en_parallel/README.md      |  4 +-
 datasets/twi_text_c3/README.md                |  4 +-
 datasets/twi_wordsim353/README.md             |  3 +-
 datasets/udhr/README.md                       |  5 +--
 datasets/um005/README.md                      |  5 +--
 datasets/un_ga/README.md                      |  5 +--
 datasets/un_multi/README.md                   |  5 +--
 datasets/un_pc/README.md                      |  5 +--
 datasets/universal_morphologies/README.md     |  4 +-
 datasets/vctk/README.md                       |  3 +-
 datasets/vivos/README.md                      |  3 +-
 datasets/web_nlg/README.md                    | 34 +-------------
 datasets/weibo_ner/README.md                  |  2 +-
 datasets/wi_locness/README.md                 |  4 +-
 datasets/wiki_asp/README.md                   |  4 +-
 datasets/wiki_atomic_edits/README.md          |  4 +-
 datasets/wiki_auto/README.md                  |  2 +-
 datasets/wiki_bio/README.md                   |  4 +-
 datasets/wiki_dpr/README.md                   |  4 +-
 datasets/wiki_lingua/README.md                |  3 +-
 datasets/wiki_source/README.md                |  5 +--
 datasets/wiki_summary/README.md               |  5 ++-
 datasets/wikiann/README.md                    |  2 +-
 datasets/wikicorpus/README.md                 | 28 +++++++-----
 datasets/wikipedia/README.md                  |  4 +-
 datasets/wikitext/README.md                   |  4 +-
 datasets/wikitext_tl39/README.md              |  4 +-
 datasets/wino_bias/README.md                  |  2 +-
 datasets/winograd_wsc/README.md               |  2 +-
 datasets/wisesight1000/README.md              |  4 +-
 datasets/wmt14/README.md                      |  5 +--
 datasets/wmt15/README.md                      |  5 +--
 datasets/wmt16/README.md                      |  5 +--
 datasets/wmt17/README.md                      |  5 +--
 datasets/wmt18/README.md                      |  5 +--
 datasets/wmt19/README.md                      |  5 +--
 datasets/wmt20_mlqe_task1/README.md           |  5 +--
 datasets/wmt20_mlqe_task2/README.md           |  5 +--
 datasets/wmt20_mlqe_task3/README.md           |  5 +--
 datasets/wmt_t2t/README.md                    |  5 +--
 datasets/wnut_17/README.md                    |  2 +-
 datasets/woz_dialogue/README.md               |  5 ++-
 datasets/xglue/README.md                      | 13 +++---
 datasets/xsum/README.md                       |  4 +-
 datasets/xsum_factuality/README.md            |  4 +-
 datasets/xtreme/README.md                     |  2 +-
 datasets/yoruba_gv_ner/README.md              |  2 +-
 datasets/yoruba_text_c3/README.md             |  4 +-
 datasets/yoruba_wordsim353/README.md          |  3 +-
 .../youtube_caption_corrections/README.md     |  3 +-
 datasets/zest/README.md                       |  4 +-
 367 files changed, 858 insertions(+), 786 deletions(-)

diff --git a/datasets/acronym_identification/README.md b/datasets/acronym_identification/README.md
index a2e205679fd..dbe60263ce4 100644
--- a/datasets/acronym_identification/README.md
+++ b/datasets/acronym_identification/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
-- structure-prediction-other-acronym-identification
+- token-classification-other-acronym-identification
 paperswithcode_id: acronym-identification
 pretty_name: Acronym Identification Dataset
 ---
diff --git a/datasets/ade_corpus_v2/README.md b/datasets/ade_corpus_v2/README.md
index 5d375ed9e2b..14246693348 100644
--- a/datasets/ade_corpus_v2/README.md
+++ b/datasets/ade_corpus_v2/README.md
@@ -22,9 +22,9 @@ task_categories:
   Ade_corpus_v2_classification:
   - text-classification
   Ade_corpus_v2_drug_ade_relation:
-  - structure-prediction
+  - token-classification
   Ade_corpus_v2_drug_dosage_relation:
-  - structure-prediction
+  - token-classification
 task_ids:
   Ade_corpus_v2_classification:
   - fact-checking
diff --git a/datasets/afrikaans_ner_corpus/README.md b/datasets/afrikaans_ner_corpus/README.md
index b32383cb67d..44385876c49 100644
--- a/datasets/afrikaans_ner_corpus/README.md
+++ b/datasets/afrikaans_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/air_dialogue/README.md b/datasets/air_dialogue/README.md
index e6952f18de6..112569c12eb 100644
--- a/datasets/air_dialogue/README.md
+++ b/datasets/air_dialogue/README.md
@@ -15,12 +15,14 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- conversational
+- text-generation
+- fill-mask
 task_ids:
-- conditional-text-generation-other-dialogue-generation
+- dialogue-generation
 - dialogue-modeling
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 ---
 
diff --git a/datasets/allegro_reviews/README.md b/datasets/allegro_reviews/README.md
index 53b29b53d7b..c9f8434335f 100644
--- a/datasets/allegro_reviews/README.md
+++ b/datasets/allegro_reviews/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
 - sentiment-scoring
+- text-scoring
 paperswithcode_id: allegro-reviews
 pretty_name: Allegro Reviews
 ---
diff --git a/datasets/alt/README.md b/datasets/alt/README.md
index 3546370e30d..a035b4e5594 100644
--- a/datasets/alt/README.md
+++ b/datasets/alt/README.md
@@ -40,10 +40,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- structure-prediction
+- translation
+- token-classification
 task_ids:
-- machine-translation
 - parsing
 paperswithcode_id: alt
 pretty_name: Asian Language Treebank
diff --git a/datasets/amazon_reviews_multi/README.md b/datasets/amazon_reviews_multi/README.md
index 55391781530..a998cf8511d 100644
--- a/datasets/amazon_reviews_multi/README.md
+++ b/datasets/amazon_reviews_multi/README.md
@@ -58,15 +58,16 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- summarization
+- text-generation
+- fill-mask
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - language-modeling
+- masked-language-modeling
 - sentiment-classification
 - sentiment-scoring
-- summarization
 - topic-classification
 paperswithcode_id: null
 pretty_name: The Multilingual Amazon Reviews Corpus
diff --git a/datasets/ami/README.md b/datasets/ami/README.md
index c5e763a76a5..93b1c0cb17d 100644
--- a/datasets/ami/README.md
+++ b/datasets/ami/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for AMI Corpus
diff --git a/datasets/amttl/README.md b/datasets/amttl/README.md
index 8670c554b65..7b5ea22e195 100644
--- a/datasets/amttl/README.md
+++ b/datasets/amttl/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - parsing
 paperswithcode_id: null
diff --git a/datasets/app_reviews/README.md b/datasets/app_reviews/README.md
index 1a932dad5b1..3a6fe0e664c 100644
--- a/datasets/app_reviews/README.md
+++ b/datasets/app_reviews/README.md
@@ -14,8 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - sentiment-scoring
 paperswithcode_id: null
 pretty_name: AppReviews
diff --git a/datasets/aquamuse/README.md b/datasets/aquamuse/README.md
index 41e80eae341..745e1bb6704 100644
--- a/datasets/aquamuse/README.md
+++ b/datasets/aquamuse/README.md
@@ -20,6 +20,7 @@ source_datasets:
 task_categories:
 - other
 - question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
 - extractive-qa
diff --git a/datasets/arabic_billion_words/README.md b/datasets/arabic_billion_words/README.md
index ce93ac175f7..62d7bca307a 100644
--- a/datasets/arabic_billion_words/README.md
+++ b/datasets/arabic_billion_words/README.md
@@ -33,9 +33,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Arabic Billion Words
 ---
diff --git a/datasets/arabic_pos_dialect/README.md b/datasets/arabic_pos_dialect/README.md
index a519eca613d..e6632488cc3 100644
--- a/datasets/arabic_pos_dialect/README.md
+++ b/datasets/arabic_pos_dialect/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - part-of-speech-tagging
 paperswithcode_id: null
diff --git a/datasets/arabic_speech_corpus/README.md b/datasets/arabic_speech_corpus/README.md
index c9f064dd02d..a12f9bf6d56 100644
--- a/datasets/arabic_speech_corpus/README.md
+++ b/datasets/arabic_speech_corpus/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for Arabic Speech Corpus
diff --git a/datasets/arxiv_dataset/README.md b/datasets/arxiv_dataset/README.md
index fdd9b79b264..6793e480e05 100644
--- a/datasets/arxiv_dataset/README.md
+++ b/datasets/arxiv_dataset/README.md
@@ -14,15 +14,14 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
+- summarization
 - text-retrieval
 task_ids:
 - document-retrieval
 - entity-linking-retrieval
 - explanation-generation
 - fact-checking-retrieval
-- machine-translation
-- summarization
 - text-simplification
 paperswithcode_id: null
 pretty_name: arXiv Dataset
diff --git a/datasets/asset/README.md b/datasets/asset/README.md
index b70d66cc253..24f697d338d 100644
--- a/datasets/asset/README.md
+++ b/datasets/asset/README.md
@@ -16,12 +16,12 @@ source_datasets:
 - extended|other-turkcorpus
 task_categories:
   ratings:
-  - text-scoring
+  - text-classification
   simplification:
-  - conditional-text-generation
+  - text2text-generation
 task_ids:
   ratings:
-  - text-scoring-other-simplification-evaluation
+  - text-classification-other-simplification-evaluation
   simplification:
   - text-simplification
 paperswithcode_id: asset
@@ -67,7 +67,7 @@ splitting in [HSplit](https://www.aclweb.org/anthology/D18-1081.pdf)), the simpl
 
 ### Supported Tasks and Leaderboards
 
-The dataset supports the evaluation of `test-simplification` systems. Success in this tasks is typically measured using the [SARI](https://huggingface.co/metrics/sari) and [FKBLEU](https://huggingface.co/metrics/fkbleu) metrics described in the paper [Optimizing Statistical Machine Translation for Text Simplification](https://www.aclweb.org/anthology/Q16-1029.pdf).
+The dataset supports the evaluation of `text-simplification` systems. Success in this task is typically measured using the [SARI](https://huggingface.co/metrics/sari) and [FKBLEU](https://huggingface.co/metrics/fkbleu) metrics described in the paper [Optimizing Statistical Machine Translation for Text Simplification](https://www.aclweb.org/anthology/Q16-1029.pdf).
 
 ### Languages
 
diff --git a/datasets/assin/README.md b/datasets/assin/README.md
index c15f2de834b..3717b499871 100644
--- a/datasets/assin/README.md
+++ b/datasets/assin/README.md
@@ -16,8 +16,8 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - natural-language-inference
 - semantic-similarity-scoring
 paperswithcode_id: assin
diff --git a/datasets/assin2/README.md b/datasets/assin2/README.md
index 6a4cbdc4c52..9bf5e2c309a 100644
--- a/datasets/assin2/README.md
+++ b/datasets/assin2/README.md
@@ -15,8 +15,8 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - natural-language-inference
 - semantic-similarity-scoring
 paperswithcode_id: assin2
diff --git a/datasets/atomic/README.md b/datasets/atomic/README.md
index 410502f1220..903354a606f 100755
--- a/datasets/atomic/README.md
+++ b/datasets/atomic/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- other-structured-to-text
+- text2text-generation-other-common-sense-if-then-reasoning
 paperswithcode_id: atomic
 ---
 
diff --git a/datasets/autshumato/README.md b/datasets/autshumato/README.md
index 46ecb299df9..3afffcd1342 100644
--- a/datasets/autshumato/README.md
+++ b/datasets/autshumato/README.md
@@ -40,9 +40,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: autshumato
 ---
diff --git a/datasets/bbaw_egyptian/README.md b/datasets/bbaw_egyptian/README.md
index a34c9e2610e..93f6f6b4b76 100644
--- a/datasets/bbaw_egyptian/README.md
+++ b/datasets/bbaw_egyptian/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - extended|wikipedia
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: BbawEgyptian
 ---
diff --git a/datasets/bc2gm_corpus/README.md b/datasets/bc2gm_corpus/README.md
index d8b3d9670fa..64da0edcea9 100644
--- a/datasets/bc2gm_corpus/README.md
+++ b/datasets/bc2gm_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/best2009/README.md b/datasets/best2009/README.md
index 026633232b6..5bf4362e31d 100644
--- a/datasets/best2009/README.md
+++ b/datasets/best2009/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
-- structure-prediction-other-word-tokenization
+- token-classification-other-word-tokenization
 paperswithcode_id: null
 pretty_name: best2009
 ---
diff --git a/datasets/bianet/README.md b/datasets/bianet/README.md
index 3e8169f9284..85061259a50 100644
--- a/datasets/bianet/README.md
+++ b/datasets/bianet/README.md
@@ -27,9 +27,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: bianet
 pretty_name: Bianet
 ---
diff --git a/datasets/bible_para/README.md b/datasets/bible_para/README.md
index 67755ef417a..8fa40fdf31f 100644
--- a/datasets/bible_para/README.md
+++ b/datasets/bible_para/README.md
@@ -115,9 +115,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: BiblePara
 ---
diff --git a/datasets/big_patent/README.md b/datasets/big_patent/README.md
index 9ca05553a89..cdee0f5f7a7 100644
--- a/datasets/big_patent/README.md
+++ b/datasets/big_patent/README.md
@@ -33,9 +33,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-patent-summarization
 paperswithcode_id: bigpatent
 pretty_name: Big Patent
 ---
diff --git a/datasets/billsum/README.md b/datasets/billsum/README.md
index 694d095cac7..cdca4737043 100644
--- a/datasets/billsum/README.md
+++ b/datasets/billsum/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-bills-summarization
 paperswithcode_id: billsum
 pretty_name: BillSum
 ---
diff --git a/datasets/biosses/README.md b/datasets/biosses/README.md
index 5b66590225a..6e6b75ab5ab 100644
--- a/datasets/biosses/README.md
+++ b/datasets/biosses/README.md
@@ -14,8 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: biosses
 pretty_name: BIOSSES
diff --git a/datasets/blbooks/README.md b/datasets/blbooks/README.md
index 2542ce04f9a..1969d2604da 100644
--- a/datasets/blbooks/README.md
+++ b/datasets/blbooks/README.md
@@ -20,10 +20,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - other
 task_ids:
 - language-modeling
+- masked-language-modeling
 - other-other-digital-humanities-research
 ---
 
diff --git a/datasets/blbooksgenre/README.md b/datasets/blbooksgenre/README.md
index 6a3a6aee0e0..53d20bf6be8 100644
--- a/datasets/blbooksgenre/README.md
+++ b/datasets/blbooksgenre/README.md
@@ -25,11 +25,13 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - topic-classification
 - multi-label-classification
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for blbooksgenre
diff --git a/datasets/bnl_newspapers/README.md b/datasets/bnl_newspapers/README.md
index 4b6a7f1ae9e..9cbfac740ff 100644
--- a/datasets/bnl_newspapers/README.md
+++ b/datasets/bnl_newspapers/README.md
@@ -22,9 +22,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for BnL Historical Newspapers
diff --git a/datasets/bookcorpus/README.md b/datasets/bookcorpus/README.md
index bc6badeb50b..8e5ca1dff9b 100644
--- a/datasets/bookcorpus/README.md
+++ b/datasets/bookcorpus/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: bookcorpus
 ---
 
diff --git a/datasets/bookcorpusopen/README.md b/datasets/bookcorpusopen/README.md
index 2f4ffc95dbf..b06cb5f3c21 100644
--- a/datasets/bookcorpusopen/README.md
+++ b/datasets/bookcorpusopen/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: bookcorpus
 ---
 
diff --git a/datasets/brwac/README.md b/datasets/brwac/README.md
index 3669e44f0f3..3cc4bd102b0 100644
--- a/datasets/brwac/README.md
+++ b/datasets/brwac/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: brwac
 pretty_name: BrWaC
 ---
diff --git a/datasets/bsd_ja_en/README.md b/datasets/bsd_ja_en/README.md
index 1bc90e8f54c..87c1aa85b3a 100644
--- a/datasets/bsd_ja_en/README.md
+++ b/datasets/bsd_ja_en/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-business-conversations-translation
 paperswithcode_id: business-scene-dialogue
 pretty_name: Business Scene Dialogue
 ---
diff --git a/datasets/bswac/README.md b/datasets/bswac/README.md
index c8a75e7c112..50799d45658 100644
--- a/datasets/bswac/README.md
+++ b/datasets/bswac/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: BsWac
 ---
diff --git a/datasets/c4/README.md b/datasets/c4/README.md
index 9b8455b15f0..d41d3a25613 100644
--- a/datasets/c4/README.md
+++ b/datasets/c4/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: c4
 ---
 
diff --git a/datasets/caner/README.md b/datasets/caner/README.md
index 99de3de9c52..7c0781659da 100644
--- a/datasets/caner/README.md
+++ b/datasets/caner/README.md
@@ -13,7 +13,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/capes/README.md b/datasets/capes/README.md
index 0678b06717a..edf195bc9e7 100644
--- a/datasets/capes/README.md
+++ b/datasets/capes/README.md
@@ -15,9 +15,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-theses-translation
+- translation-other-dissertation-abstracts-translation
 paperswithcode_id: capes
 pretty_name: CAPES
 ---
diff --git a/datasets/casino/README.md b/datasets/casino/README.md
index 9ae616c3d15..7dea40d28ee 100644
--- a/datasets/casino/README.md
+++ b/datasets/casino/README.md
@@ -14,10 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- conversational
+- text-generation
+- fill-mask
 task_ids:
-- conditional-text-generation-other-dialogue-generation
 - dialogue-modeling
 pretty_name: Campsite Negotiation Dialogues
 paperswithcode_id: casino
diff --git a/datasets/cawac/README.md b/datasets/cawac/README.md
index 0db683b591c..211f4170e2f 100644
--- a/datasets/cawac/README.md
+++ b/datasets/cawac/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: cawac
 pretty_name: caWaC
 ---
diff --git a/datasets/cc100/README.md b/datasets/cc100/README.md
index 5b1bf401dc9..ca5b71c40bc 100644
--- a/datasets/cc100/README.md
+++ b/datasets/cc100/README.md
@@ -132,9 +132,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: cc100
 pretty_name: CC100
 ---
diff --git a/datasets/cc_news/README.md b/datasets/cc_news/README.md
index 8aab90f8018..e0fe8568744 100644
--- a/datasets/cc_news/README.md
+++ b/datasets/cc_news/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: cc-news
 ---
 
diff --git a/datasets/chr_en/README.md b/datasets/chr_en/README.md
index c92552bf5e0..9f1c03fb20d 100644
--- a/datasets/chr_en/README.md
+++ b/datasets/chr_en/README.md
@@ -46,22 +46,21 @@ source_datasets:
 - original
 task_categories:
   monolingual:
-  - conditional-text-generation
+  - translation
   monolingual_raw:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   parallel:
-  - conditional-text-generation
+  - translation
   parallel_raw:
-  - conditional-text-generation
+  - translation
 task_ids:
-  monolingual:
-  - machine-translation
+  monolingual: []
   monolingual_raw:
   - language-modeling
-  parallel:
-  - machine-translation
-  parallel_raw:
-  - machine-translation
+  - masked-language-modeling
+  parallel: []
+  parallel_raw: []
 paperswithcode_id: chren
 ---
 
diff --git a/datasets/climate_fever/README.md b/datasets/climate_fever/README.md
index 4050e0bd20b..eb22f4e2177 100644
--- a/datasets/climate_fever/README.md
+++ b/datasets/climate_fever/README.md
@@ -18,8 +18,8 @@ source_datasets:
 task_categories:
 - text-classification
 - text-retrieval
-- text-scoring
 task_ids:
+- text-scoring
 - fact-checking
 - fact-checking-retrieval
 - semantic-similarity-scoring
diff --git a/datasets/cmu_hinglish_dog/README.md b/datasets/cmu_hinglish_dog/README.md
index 027619a9b52..607477ccd8e 100644
--- a/datasets/cmu_hinglish_dog/README.md
+++ b/datasets/cmu_hinglish_dog/README.md
@@ -18,9 +18,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for CMU Document Grounded Conversations
diff --git a/datasets/cnn_dailymail/README.md b/datasets/cnn_dailymail/README.md
index fa16607cd43..41224565d5c 100644
--- a/datasets/cnn_dailymail/README.md
+++ b/datasets/cnn_dailymail/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 paperswithcode_id: cnn-daily-mail-1
 pretty_name: CNN / Daily Mail
 ---
diff --git a/datasets/coached_conv_pref/README.md b/datasets/coached_conv_pref/README.md
index b7d7ac2904a..e0a380103a5 100644
--- a/datasets/coached_conv_pref/README.md
+++ b/datasets/coached_conv_pref/README.md
@@ -15,8 +15,9 @@ source_datasets:
 - original
 task_categories:
 - other
-- sequence-modeling
-- structure-prediction
+- text-generation
+- fill-mask
+- token-classification
 task_ids:
 - other-other-Conversational Recommendation
 - dialogue-modeling
diff --git a/datasets/code_search_net/README.md b/datasets/code_search_net/README.md
index dfefe894417..fb475993ca3 100644
--- a/datasets/code_search_net/README.md
+++ b/datasets/code_search_net/README.md
@@ -27,9 +27,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: codesearchnet
 pretty_name: CodeSearchNet
 ---
diff --git a/datasets/code_x_glue_cc_cloze_testing_all/README.md b/datasets/code_x_glue_cc_cloze_testing_all/README.md
index 69cb15a9ff5..cccd954b7e6 100644
--- a/datasets/code_x_glue_cc_cloze_testing_all/README.md
+++ b/datasets/code_x_glue_cc_cloze_testing_all/README.md
@@ -25,7 +25,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - slot-filling
 pretty_name: CodeXGlueCcClozeTestingAll
diff --git a/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md b/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md
index 6297269934a..9c3e8031df5 100644
--- a/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md
+++ b/datasets/code_x_glue_cc_cloze_testing_maxmin/README.md
@@ -25,7 +25,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - slot-filling
 pretty_name: CodeXGlueCcClozeTestingMaxmin
diff --git a/datasets/code_x_glue_cc_code_completion_line/README.md b/datasets/code_x_glue_cc_code_completion_line/README.md
index e455c7bd219..0e3232b665c 100644
--- a/datasets/code_x_glue_cc_code_completion_line/README.md
+++ b/datasets/code_x_glue_cc_code_completion_line/README.md
@@ -25,7 +25,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - slot-filling
 pretty_name: CodeXGlueCcCodeCompletionLine
diff --git a/datasets/code_x_glue_cc_code_completion_token/README.md b/datasets/code_x_glue_cc_code_completion_token/README.md
index b35fd706ffb..80eaecb5c78 100644
--- a/datasets/code_x_glue_cc_code_completion_token/README.md
+++ b/datasets/code_x_glue_cc_code_completion_token/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 pretty_name: CodeXGlueCcCodeCompletionToken
 ---
 # Dataset Card for "code_x_glue_cc_code_completion_token"
diff --git a/datasets/code_x_glue_cc_code_refinement/README.md b/datasets/code_x_glue_cc_code_refinement/README.md
index 2a021cba785..cd8c8999a2f 100644
--- a/datasets/code_x_glue_cc_code_refinement/README.md
+++ b/datasets/code_x_glue_cc_code_refinement/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-debugging
+- text2text-generation-other-debugging
 pretty_name: CodeXGlueCcCodeRefinement
 ---
 
@@ -58,7 +58,7 @@ We use the dataset released by this paper(https://arxiv.org/pdf/1812.08693.pdf).
 
 ### Supported Tasks and Leaderboards
 
-- `conditional-text-generation-other-debugging`: The dataset can be used to train a model for automatically fixing buggy code.
+- `text2text-generation-other-debugging`: The dataset can be used to train a model for automatically fixing buggy code.
 
 ### Languages
 
diff --git a/datasets/code_x_glue_cc_code_to_code_trans/README.md b/datasets/code_x_glue_cc_code_to_code_trans/README.md
index c403b360a42..f4ae60a8c93 100644
--- a/datasets/code_x_glue_cc_code_to_code_trans/README.md
+++ b/datasets/code_x_glue_cc_code_to_code_trans/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-code-to-code
 pretty_name: CodeXGlueCcCodeToCodeTrans
 ---
 # Dataset Card for "code_x_glue_cc_code_to_code_trans"
diff --git a/datasets/code_x_glue_ct_code_to_text/README.md b/datasets/code_x_glue_ct_code_to_text/README.md
index aa457452139..3865687cedf 100644
--- a/datasets/code_x_glue_ct_code_to_text/README.md
+++ b/datasets/code_x_glue_ct_code_to_text/README.md
@@ -26,9 +26,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-code-to-text
 pretty_name: CodeXGlueCtCodeToText
 ---
 # Dataset Card for "code_x_glue_ct_code_to_text"
diff --git a/datasets/code_x_glue_tc_text_to_code/README.md b/datasets/code_x_glue_tc_text_to_code/README.md
index e10824df6b8..51070edac0b 100644
--- a/datasets/code_x_glue_tc_text_to_code/README.md
+++ b/datasets/code_x_glue_tc_text_to_code/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-text-to-code
 pretty_name: CodeXGlueTcTextToCode
 ---
 # Dataset Card for "code_x_glue_tc_text_to_code"
diff --git a/datasets/code_x_glue_tt_text_to_text/README.md b/datasets/code_x_glue_tt_text_to_text/README.md
index 48f90fda204..0761a65b925 100644
--- a/datasets/code_x_glue_tt_text_to_text/README.md
+++ b/datasets/code_x_glue_tt_text_to_text/README.md
@@ -18,9 +18,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 task_ids:
-- machine-translation
+- translation-other-code-documentation-translation
 pretty_name: CodeXGlueTtTextToText
 ---
 # Dataset Card for "code_x_glue_tt_text_to_text"
diff --git a/datasets/common_gen/README.md b/datasets/common_gen/README.md
index 75b73501f1b..b819df86681 100644
--- a/datasets/common_gen/README.md
+++ b/datasets/common_gen/README.md
@@ -3,6 +3,10 @@ languages:
 - en
 paperswithcode_id: commongen
 pretty_name: CommonGen
+task_ids:
+- text2text-generation-other-concepts-to-text
+task_categories:
+- text2text-generation
 ---
 
 # Dataset Card for "common_gen"
diff --git a/datasets/common_language/README.md b/datasets/common_language/README.md
index a2804ca3851..522b881ffcc 100644
--- a/datasets/common_language/README.md
+++ b/datasets/common_language/README.md
@@ -59,9 +59,9 @@ size_categories:
 source_datasets:
 - extended|common_voice
 task_categories:
-- speech-processing
+- audio-classification
 task_ids:
-- other-other-speech-classification
+- speaker-language-identification
 ---
 
 # Dataset Card for common_language
diff --git a/datasets/common_voice/README.md b/datasets/common_voice/README.md
index bdd46378910..230b1fdd465 100644
--- a/datasets/common_voice/README.md
+++ b/datasets/common_voice/README.md
@@ -193,9 +193,8 @@ size_categories:
 source_datasets:
 - extended|common_voice
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 paperswithcode_id: common-voice
 ---
 
diff --git a/datasets/competition_math/README.md b/datasets/competition_math/README.md
index 1de4e51f69e..09a8a567fba 100644
--- a/datasets/competition_math/README.md
+++ b/datasets/competition_math/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- explanation-generation
+- text2text-generation-other-explanation-generation
 ---
 
 # Dataset Card for Mathematics Aptitude Test of Heuristics (MATH) dataset
diff --git a/datasets/conll2002/README.md b/datasets/conll2002/README.md
index c84899b5040..3113faefa8d 100644
--- a/datasets/conll2002/README.md
+++ b/datasets/conll2002/README.md
@@ -17,7 +17,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
diff --git a/datasets/conll2003/README.md b/datasets/conll2003/README.md
index 3b466be3f34..97b43530119 100644
--- a/datasets/conll2003/README.md
+++ b/datasets/conll2003/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended|other-reuters-corpus
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
diff --git a/datasets/conll2012_ontonotesv5/README.md b/datasets/conll2012_ontonotesv5/README.md
index bd776dc04c4..9851f7e347e 100644
--- a/datasets/conll2012_ontonotesv5/README.md
+++ b/datasets/conll2012_ontonotesv5/README.md
@@ -18,7 +18,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
diff --git a/datasets/conllpp/README.md b/datasets/conllpp/README.md
index 5284f4bd37e..4d3307da20b 100644
--- a/datasets/conllpp/README.md
+++ b/datasets/conllpp/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended|conll2003
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: conll
diff --git a/datasets/conv_ai/README.md b/datasets/conv_ai/README.md
index 76a66aeb127..69825916cc7 100644
--- a/datasets/conv_ai/README.md
+++ b/datasets/conv_ai/README.md
@@ -14,10 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- text-scoring
+- conversational
+- text-classification
 task_ids:
-- text-scoring-other-evaluating-dialogue-systems
+- text-scoring
+- text-classification-other-evaluating-dialogue-systems
 paperswithcode_id: null
 pretty_name: ConvAi
 ---
diff --git a/datasets/conv_ai_2/README.md b/datasets/conv_ai_2/README.md
index 19304823e8f..d6f779a2369 100644
--- a/datasets/conv_ai_2/README.md
+++ b/datasets/conv_ai_2/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- text-scoring
+- conversational
+- text-classification
 task_ids:
+- text-scoring
 - text-scoring-other-evaluating-dialogue-systems
 paperswithcode_id: convai2
 pretty_name: Conversational Intelligence Challenge 2
diff --git a/datasets/conv_ai_3/README.md b/datasets/conv_ai_3/README.md
index c2659226ec6..b1fbf425c27 100644
--- a/datasets/conv_ai_3/README.md
+++ b/datasets/conv_ai_3/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- text-scoring
+- conversational
+- text-classification
 task_ids:
+- text-scoring
 - text-scoring-other-evaluating-dialogue-systems
 paperswithcode_id: null
 pretty_name: More Information Needed
diff --git a/datasets/conv_questions/README.md b/datasets/conv_questions/README.md
index 81d99d2b71f..690f244486d 100644
--- a/datasets/conv_questions/README.md
+++ b/datasets/conv_questions/README.md
@@ -15,7 +15,8 @@ source_datasets:
 - original
 task_categories:
 - question-answering
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - open-domain-qa
 - dialogue-modeling
diff --git a/datasets/counter/README.md b/datasets/counter/README.md
index f1405bd7453..a7e18fe1c2e 100644
--- a/datasets/counter/README.md
+++ b/datasets/counter/README.md
@@ -15,8 +15,8 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 - topic-classification
 paperswithcode_id: counter
diff --git a/datasets/covost2/README.md b/datasets/covost2/README.md
index febbabb48d9..6b077d2f73f 100644
--- a/datasets/covost2/README.md
+++ b/datasets/covost2/README.md
@@ -35,9 +35,8 @@ size_categories:
 source_datasets:
 - extended|other-common-voice
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 paperswithcode_id: null
 pretty_name: CoVoST 2
 ---
diff --git a/datasets/craigslist_bargains/README.md b/datasets/craigslist_bargains/README.md
index 92c4f93cc31..c28852d6f07 100644
--- a/datasets/craigslist_bargains/README.md
+++ b/datasets/craigslist_bargains/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: craigslistbargains
diff --git a/datasets/crd3/README.md b/datasets/crd3/README.md
index b5eced9e7a1..6394e94eb8b 100644
--- a/datasets/crd3/README.md
+++ b/datasets/crd3/README.md
@@ -13,10 +13,10 @@ multilinguality:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
-task_ids:
 - summarization
+- text-generation
+- fill-mask
+task_ids:
 - dialogue-modeling
 size_categories:
 - 10K<n<100K
diff --git a/datasets/crows_pairs/README.md b/datasets/crows_pairs/README.md
index 539bd391540..114e1cbb951 100644
--- a/datasets/crows_pairs/README.md
+++ b/datasets/crows_pairs/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
-- text-scoring-other-bias-evaluation
+- text-scoring
+- text-classification-other-bias-evaluation
 paperswithcode_id: crows-pairs
 pretty_name: CrowS-Pairs
 ---
diff --git a/datasets/cs_restaurants/README.md b/datasets/cs_restaurants/README.md
index e6c944ce12f..1a8127d319b 100644
--- a/datasets/cs_restaurants/README.md
+++ b/datasets/cs_restaurants/README.md
@@ -15,12 +15,14 @@ size_categories:
 source_datasets:
 - extended|other-san-francisco-restaurants
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- text2text-generation
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 - language-modeling
-- other-structured-to-text
+- masked-language-modeling
+- text2text-generation-other-intent-to-text
 paperswithcode_id: czech-restaurant-information
 pretty_name: Czech Restaurant
 ---
@@ -62,7 +64,7 @@ This is a dataset for NLG in task-oriented spoken dialogue systems with Czech as
 
 ### Supported Tasks and Leaderboards
 
-- `other-structured-to-text`: The dataset can be used to train a model for data-to-text generation: from a desired dialogue act, the model must produce textual output that conveys this intention.
+- `other-intent-to-text`: The dataset can be used to train a model for data-to-text generation: from a desired dialogue act, the model must produce textual output that conveys this intention.
 
 ### Languages
 
diff --git a/datasets/curiosity_dialogs/README.md b/datasets/curiosity_dialogs/README.md
index 28b5e2f11b9..96f8e1c841d 100644
--- a/datasets/curiosity_dialogs/README.md
+++ b/datasets/curiosity_dialogs/README.md
@@ -14,10 +14,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
-- sequence-modeling-other-conversational-curiosity
+- text-generation-other-conversational-curiosity
+- fill-mask-other-conversational-curiosity
 paperswithcode_id: curiosity
 pretty_name: Curiosity Dataset
 ---
@@ -61,7 +63,7 @@ Curiosity dataset consists of 14K English dialogs (181K utterances) where users
 
 ### Supported Tasks and Leaderboards
 
-* `sequence-modeling-other-conversational-curiosity`: The dataset can be used to train a model for Conversational Curiosity, which consists in the testing of the hypothesis that engagement increases when users are presented with facts related to what they know. Success on this task is typically measured by achieving a *high* [Accuracy](https://huggingface.co/metrics/accuracy) and [F1 Score](https://huggingface.co/metrics/f1).
+* `text-generation-other-conversational-curiosity`: The dataset can be used to train a model for Conversational Curiosity, which consists in the testing of the hypothesis that engagement increases when users are presented with facts related to what they know. Success on this task is typically measured by achieving a *high* [Accuracy](https://huggingface.co/metrics/accuracy) and [F1 Score](https://huggingface.co/metrics/f1).
 
 ### Languages
 
diff --git a/datasets/dane/README.md b/datasets/dane/README.md
index 75f9da4a9c9..7bf71d17bc9 100644
--- a/datasets/dane/README.md
+++ b/datasets/dane/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended|other-Danish-Universal-Dependencies-treebank
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
diff --git a/datasets/dart/README.md b/datasets/dart/README.md
index 47f6169b33c..a62f65f6595 100644
--- a/datasets/dart/README.md
+++ b/datasets/dart/README.md
@@ -19,9 +19,9 @@ source_datasets:
 - extended|web_nlg
 - extended|cleaned_e2e
 task_categories:
-- conditional-text-generation
+- structured-to-text
 task_ids:
-- conditional-text-generation-other-rdf-to-text
+- rdf-to-text
 paperswithcode_id: dart
 pretty_name: DART
 ---
@@ -67,7 +67,7 @@ DART is a large dataset for open-domain structured data record to text generatio
 
 The task associated to DART is text generation from data records that are RDF triplets:
 
-- `conditional-text-generation-other-rdf-to-text`: The dataset can be used to train a model for text generation from RDF triplets, which consists in generating textual description of structured data. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [METEOR](https://huggingface.co/metrics/meteor), [BLEURT](https://huggingface.co/metrics/bleurt), [TER](https://huggingface.co/metrics/ter), [MoverScore](https://huggingface.co/metrics/mover_score), and [BERTScore](https://huggingface.co/metrics/bert_score). The ([BART-large model](https://huggingface.co/facebook/bart-large) from [BART](https://huggingface.co/transformers/model_doc/bart.html)) model currently achieves the following scores:
+- `rdf-to-text`: The dataset can be used to train a model for text generation from RDF triplets, which consists in generating textual description of structured data. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [METEOR](https://huggingface.co/metrics/meteor), [BLEURT](https://huggingface.co/metrics/bleurt), [TER](https://huggingface.co/metrics/ter), [MoverScore](https://huggingface.co/metrics/mover_score), and [BERTScore](https://huggingface.co/metrics/bert_score). The ([BART-large model](https://huggingface.co/facebook/bart-large) from [BART](https://huggingface.co/transformers/model_doc/bart.html)) model currently achieves the following scores:
 
 |            | BLEU  | METEOR | TER  | MoverScore  | BERTScore  | BLEURT |
 | -----      | ----- | ------ | ---- | ----------- | ---------- | ------ |
diff --git a/datasets/dbrd/README.md b/datasets/dbrd/README.md
index 93d1668d8cb..5f22ef35ee1 100644
--- a/datasets/dbrd/README.md
+++ b/datasets/dbrd/README.md
@@ -15,10 +15,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
 task_ids:
 - language-modeling
+- masked-language-modeling
 - sentiment-classification
 paperswithcode_id: dbrd
 ---
@@ -63,7 +65,7 @@ The DBRD (pronounced *dee-bird*) dataset contains over 110k book reviews of whic
 
 ### Supported Tasks and Leaderboards
 
-- `sequence-modeling`: The dataset can be used to train a model for sequence modeling, more specifically language modeling.
+- `text-generation`: The dataset can be used to train a model for sequence modeling, more specifically language modeling.
 - `text-classification`: The dataset can be used to train a model for text classification, more specifically sentiment classification, using the provided positive/negative sentiment polarity labels.
 
 ### Languages
diff --git a/datasets/deal_or_no_dialog/README.md b/datasets/deal_or_no_dialog/README.md
index 261f34f3334..75fc6c73f28 100644
--- a/datasets/deal_or_no_dialog/README.md
+++ b/datasets/deal_or_no_dialog/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- conditional-text-generation-other-dialogue-generation
+- conversational
+task_ids: []
 paperswithcode_id: negotiation-dialogues-dataset
 pretty_name: Deal or No Deal Negotiator
 ---
diff --git a/datasets/dialog_re/README.md b/datasets/dialog_re/README.md
index a43d5604f4c..ba6ba087434 100644
--- a/datasets/dialog_re/README.md
+++ b/datasets/dialog_re/README.md
@@ -15,7 +15,8 @@ source_datasets:
 - original
 task_categories:
 - other
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - other-other-relation-extraction
 - dialogue-modeling
diff --git a/datasets/disaster_response_messages/README.md b/datasets/disaster_response_messages/README.md
index ab04c4c597b..6cc9c750998 100644
--- a/datasets/disaster_response_messages/README.md
+++ b/datasets/disaster_response_messages/README.md
@@ -18,7 +18,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 - text-classification
 task_ids:
 - intent-classification
diff --git a/datasets/drop/README.md b/datasets/drop/README.md
index d3ee7a54c96..82b078383ce 100644
--- a/datasets/drop/README.md
+++ b/datasets/drop/README.md
@@ -16,6 +16,7 @@ source_datasets:
 - original
 task_categories:
 - question-answering
+- text2text-generation
 task_ids:
 - extractive-qa
 - abstractive-qa
diff --git a/datasets/duorc/README.md b/datasets/duorc/README.md
index 1ac6a5264f1..a68661aed49 100644
--- a/datasets/duorc/README.md
+++ b/datasets/duorc/README.md
@@ -18,6 +18,7 @@ source_datasets:
 - original
 task_categories:
 - question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
 - extractive-qa
diff --git a/datasets/e2e_nlg/README.md b/datasets/e2e_nlg/README.md
index 17baa7f2ed1..65a34c7670c 100644
--- a/datasets/e2e_nlg/README.md
+++ b/datasets/e2e_nlg/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-meaning-representtion-to-text
+- text2text-generation-other-meaning-representation-to-text
 paperswithcode_id: e2e
 pretty_name: End-to-End NLG Challenge
 ---
@@ -67,7 +67,7 @@ https://arxiv.org/abs/1706.09254
 
 ### Supported Tasks and Leaderboards
 
-- `conditional-text-generation-other-meaning-representtion-to-text`: The dataset can be used to train a model to generate descriptions in the restaurant domain from meaning representations, which consists in taking as input some data about a restaurant and generate a sentence in natural language that presents the different aspects of the data about the restaurant.. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [NIST](https://huggingface.co/metrics/nist), [METEOR](https://huggingface.co/metrics/meteor), [Rouge-L](https://huggingface.co/metrics/rouge), [CIDEr](https://huggingface.co/metrics/cider). The TGen model (Dusek and Jurcıcek, 2016a) was used a baseline, had the following scores:
+- `text2text-generation-other-meaning-representation-to-text`: The dataset can be used to train a model to generate descriptions in the restaurant domain from meaning representations, which consists in taking as input some data about a restaurant and generate a sentence in natural language that presents the different aspects of the data about the restaurant.. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [NIST](https://huggingface.co/metrics/nist), [METEOR](https://huggingface.co/metrics/meteor), [Rouge-L](https://huggingface.co/metrics/rouge), [CIDEr](https://huggingface.co/metrics/cider). The TGen model (Dusek and Jurcıcek, 2016a) was used a baseline, had the following scores:
 
 |          | BLEU	  | NIST   | METEOR | ROUGE_L | CIDEr  |
 | -------- | ------ | ------ | ------ | ------- | ------ |
diff --git a/datasets/e2e_nlg_cleaned/README.md b/datasets/e2e_nlg_cleaned/README.md
index 4d48ba15b24..3444856ba66 100644
--- a/datasets/e2e_nlg_cleaned/README.md
+++ b/datasets/e2e_nlg_cleaned/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-meaning-representtion-to-text
+- text2text-generation-other-meaning-representation-to-text
 paperswithcode_id: null
 pretty_name: the Cleaned Version of the E2E Dataset
 ---
@@ -69,7 +69,7 @@ https://arxiv.org/abs/1706.09254
 
 ### Supported Tasks and Leaderboards
 
-- `conditional-text-generation-other-meaning-representtion-to-text`: The dataset can be used to train a model to generate descriptions in the restaurant domain from meaning representations, which consists in taking as input some data about a restaurant and generate a sentence in natural language that presents the different aspects of the data about the restaurant.. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [NIST](https://huggingface.co/metrics/nist), [METEOR](https://huggingface.co/metrics/meteor), [Rouge-L](https://huggingface.co/metrics/rouge), [CIDEr](https://huggingface.co/metrics/cider).
+- `text2text-generation-other-meaning-representation-to-text`: The dataset can be used to train a model to generate descriptions in the restaurant domain from meaning representations, which consists in taking as input some data about a restaurant and generate a sentence in natural language that presents the different aspects of the data about the restaurant.. Success on this task is typically measured by achieving a *high* [BLEU](https://huggingface.co/metrics/bleu), [NIST](https://huggingface.co/metrics/nist), [METEOR](https://huggingface.co/metrics/meteor), [Rouge-L](https://huggingface.co/metrics/rouge), [CIDEr](https://huggingface.co/metrics/cider).
 
 
 This task has an inactive leaderboard which can be found [here](http://www.macs.hw.ac.uk/InteractionLab/E2E/) and ranks models based on the metrics above.
diff --git a/datasets/ecb/README.md b/datasets/ecb/README.md
index 7a11cc043c3..fba34e5cb78 100644
--- a/datasets/ecb/README.md
+++ b/datasets/ecb/README.md
@@ -32,9 +32,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: ecb
 pretty_name: extension to the EventCorefBank
 ---
diff --git a/datasets/ehealth_kd/README.md b/datasets/ehealth_kd/README.md
index dfac294cc5b..b4e667a311c 100644
--- a/datasets/ehealth_kd/README.md
+++ b/datasets/ehealth_kd/README.md
@@ -14,10 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
-- structure-prediction-other-relation-prediction
+- token-classification-other-relation-prediction
 paperswithcode_id: null
 pretty_name: eHealth-KD
 ---
diff --git a/datasets/eitb_parcc/README.md b/datasets/eitb_parcc/README.md
index 2af59af4149..de59c43596e 100644
--- a/datasets/eitb_parcc/README.md
+++ b/datasets/eitb_parcc/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: eitb-parcc
 pretty_name: EiTB-ParCC
 ---
diff --git a/datasets/eli5/README.md b/datasets/eli5/README.md
index 3b8a3aff2c8..6a96e8b83b9 100644
--- a/datasets/eli5/README.md
+++ b/datasets/eli5/README.md
@@ -14,10 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
-- open-domain-qa
+- open-domain-abstractive-qa
 paperswithcode_id: eli5
 pretty_name: ELI5
 ---
@@ -61,7 +61,7 @@ The ELI5 dataset is an English-language dataset of questions and answers gathere
 
 ### Supported Tasks and Leaderboards
 
-- `abstractive-qa`, `open-domain-qa`: The dataset can be used to train a model for Open Domain Long Form Question Answering. An LFQA model is presented with a non-factoid and asked to retrieve relevant information from a knowledge source (such as [Wikipedia](https://www.wikipedia.org/)), then use it to generate a multi-sentence answer. The model performance is measured by how high its [ROUGE](https://huggingface.co/metrics/rouge) score to the reference is. A [BART-based model](https://huggingface.co/yjernite/bart_eli5) with a [dense retriever](https://huggingface.co/yjernite/retribert-base-uncased) trained to draw information from [Wikipedia passages](https://huggingface.co/datasets/wiki_snippets) achieves a [ROUGE-L of 0.149](https://yjernite.github.io/lfqa.html#generation).
+- `abstractive-qa`, `open-domain-abstractive-qa`: The dataset can be used to train a model for Open Domain Long Form Question Answering. An LFQA model is presented with a non-factoid and asked to retrieve relevant information from a knowledge source (such as [Wikipedia](https://www.wikipedia.org/)), then use it to generate a multi-sentence answer. The model performance is measured by how high its [ROUGE](https://huggingface.co/metrics/rouge) score to the reference is. A [BART-based model](https://huggingface.co/yjernite/bart_eli5) with a [dense retriever](https://huggingface.co/yjernite/retribert-base-uncased) trained to draw information from [Wikipedia passages](https://huggingface.co/datasets/wiki_snippets) achieves a [ROUGE-L of 0.149](https://yjernite.github.io/lfqa.html#generation).
 
 ### Languages
 
diff --git a/datasets/eli5_category/README.md b/datasets/eli5_category/README.md
index 4d735f7d489..950ec5050a1 100644
--- a/datasets/eli5_category/README.md
+++ b/datasets/eli5_category/README.md
@@ -16,10 +16,10 @@ size_categories:
 source_datasets:
 - extended|eli5
 task_categories:
-- question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
-- open-domain-qa
+- open-domain-abstractive-qa
 ---
 
 # Dataset Card for ELI5-Category
@@ -61,7 +61,7 @@ The ELI5-Category dataset is a smaller but newer and categorized version of the
 
 ### Supported Tasks and Leaderboards
 
-- `abstractive-qa`, `open-domain-qa`: The dataset can be used to train a model for Open Domain Long Form Question Answering. An LFQA model is presented with a non-factoid and asked to retrieve relevant information from a knowledge source (such as [Wikipedia](https://www.wikipedia.org/)), then use it to generate a multi-sentence answer. 
+- `abstractive-qa`, `open-domain-abstractive-qa`: The dataset can be used to train a model for Open Domain Long Form Question Answering. An LFQA model is presented with a non-factoid and asked to retrieve relevant information from a knowledge source (such as [Wikipedia](https://www.wikipedia.org/)), then use it to generate a multi-sentence answer. 
 
 ### Languages
 
diff --git a/datasets/elkarhizketak/README.md b/datasets/elkarhizketak/README.md
index 756169477ae..efdd819af22 100644
--- a/datasets/elkarhizketak/README.md
+++ b/datasets/elkarhizketak/README.md
@@ -15,9 +15,9 @@ source_datasets:
 - original
 task_categories:
 - question-answering
-- other-dialogue
 task_ids:
 - extractive-qa
+- question-answering-other-dialogue-qa
 pretty_name: ElkarHizketak
 ---
 
diff --git a/datasets/emea/README.md b/datasets/emea/README.md
index f1a0f0094e0..772e44f6f15 100644
--- a/datasets/emea/README.md
+++ b/datasets/emea/README.md
@@ -44,9 +44,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: EMEA
 ---
diff --git a/datasets/enriched_web_nlg/README.md b/datasets/enriched_web_nlg/README.md
index 9f1db5a10dc..325426cded6 100644
--- a/datasets/enriched_web_nlg/README.md
+++ b/datasets/enriched_web_nlg/README.md
@@ -17,9 +17,9 @@ size_categories:
 source_datasets:
 - extended|other-web-nlg
 task_categories:
-- conditional-text-generation
+- structured-to-text
 task_ids:
-- other-structured-to-text
+- rdf-to-text
 paperswithcode_id: null
 pretty_name: Enriched WebNLG
 ---
@@ -64,7 +64,7 @@ DBpedia triples shown in (a), the aim is to generate a text such as (b). It is a
 
 ### Supported Tasks and Leaderboards
 
-The dataset supports a `other-structured-to-text` task which requires a model takes a set of RDF (Resource Description
+The dataset supports a `rdf-to-text` task which requires a model takes a set of RDF (Resource Description
 Format) triples from a database (DBpedia) of the form (subject, property, object) as input and write out a natural
 language sentence expressing the information contained in the triples.
 
diff --git a/datasets/euronews/README.md b/datasets/euronews/README.md
index aa4198b11c9..14a41780bb3 100644
--- a/datasets/euronews/README.md
+++ b/datasets/euronews/README.md
@@ -16,7 +16,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: europeana-newspapers
diff --git a/datasets/europa_eac_tm/README.md b/datasets/europa_eac_tm/README.md
index a2112af124f..e16c6310e91 100644
--- a/datasets/europa_eac_tm/README.md
+++ b/datasets/europa_eac_tm/README.md
@@ -39,9 +39,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: Europa Education and Culture Translation Memory (EAC-TM)
 ---
@@ -88,7 +87,7 @@ To load a language pair that is not part of the config, just specify the languag
 
 ### Supported Tasks and Leaderboards
 
-- `conditional-text-generation`: the dataset can be used to train a model for `machine-translation`. Machine translation models are usually evaluated using metrics such as [BLEU](https://huggingface.co/metrics/bleu), [ROUGE](https://huggingface.co/metrics/rouge) or [SacreBLEU](https://huggingface.co/metrics/sacrebleu). You can use the [mBART](https://huggingface.co/facebook/mbart-large-cc25) model for this task. This task has active leaderboards which can be found at [https://paperswithcode.com/task/machine-translation](https://paperswithcode.com/task/machine-translation), which usually rank models based on [BLEU score](https://huggingface.co/metrics/bleu).
+- `translation`: the dataset can be used to train a model for machine translation. Machine translation models are usually evaluated using metrics such as [BLEU](https://huggingface.co/metrics/bleu), [ROUGE](https://huggingface.co/metrics/rouge) or [SacreBLEU](https://huggingface.co/metrics/sacrebleu). You can use the [mBART](https://huggingface.co/facebook/mbart-large-cc25) model for this task. This task has active leaderboards which can be found at [https://paperswithcode.com/task/machine-translation](https://paperswithcode.com/task/machine-translation), which usually rank models based on [BLEU score](https://huggingface.co/metrics/bleu).
 
 ### Languages
 
diff --git a/datasets/europa_ecdc_tm/README.md b/datasets/europa_ecdc_tm/README.md
index 1c4f02cabf8..a3360174b22 100644
--- a/datasets/europa_ecdc_tm/README.md
+++ b/datasets/europa_ecdc_tm/README.md
@@ -38,9 +38,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: EuropaEcdcTm
 ---
@@ -91,7 +90,7 @@ To load a language pair that is not part of the config, just specify the languag
 
 ### Supported Tasks and Leaderboards
 
-- `conditional-text-generation`: the dataset can be used to train a model for `machine-translation`. Machine translation models are usually evaluated using metrics such as [BLEU](https://huggingface.co/metrics/bleu), [ROUGE](https://huggingface.co/metrics/rouge) or [SacreBLEU](https://huggingface.co/metrics/sacrebleu). You can use the [mBART](https://huggingface.co/facebook/mbart-large-cc25) model for this task. This task has active leaderboards which can be found at [https://paperswithcode.com/task/machine-translation](https://paperswithcode.com/task/machine-translation), which usually rank models based on [BLEU score](https://huggingface.co/metrics/bleu).
+- `translation`: the dataset can be used to train a model for machine translation. Machine translation models are usually evaluated using metrics such as [BLEU](https://huggingface.co/metrics/bleu), [ROUGE](https://huggingface.co/metrics/rouge) or [SacreBLEU](https://huggingface.co/metrics/sacrebleu). You can use the [mBART](https://huggingface.co/facebook/mbart-large-cc25) model for this task. This task has active leaderboards which can be found at [https://paperswithcode.com/task/machine-translation](https://paperswithcode.com/task/machine-translation), which usually rank models based on [BLEU score](https://huggingface.co/metrics/bleu).
 
 ### Languages
 
diff --git a/datasets/europarl_bilingual/README.md b/datasets/europarl_bilingual/README.md
index 68d5f86e782..158db71fe3a 100644
--- a/datasets/europarl_bilingual/README.md
+++ b/datasets/europarl_bilingual/README.md
@@ -34,9 +34,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- other
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: europarl-bilingual
 ---
diff --git a/datasets/farsi_news/README.md b/datasets/farsi_news/README.md
index 6306f7ef535..c8f7696230d 100644
--- a/datasets/farsi_news/README.md
+++ b/datasets/farsi_news/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: FarsiNews
 ---
diff --git a/datasets/finer/README.md b/datasets/finer/README.md
index d84d9a682e3..2b8f56e785e 100644
--- a/datasets/finer/README.md
+++ b/datasets/finer/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: finer
diff --git a/datasets/flores/README.md b/datasets/flores/README.md
index 796d658adcd..effb778a96b 100644
--- a/datasets/flores/README.md
+++ b/datasets/flores/README.md
@@ -28,9 +28,8 @@ source_datasets:
 - extended|other-global-voices
 - extended|other-common-crawl
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: flores
 ---
 
diff --git a/datasets/gem/README.md b/datasets/gem/README.md
index 791ce1d6b16..c8a390f01b4 100644
--- a/datasets/gem/README.md
+++ b/datasets/gem/README.md
@@ -215,46 +215,47 @@ source_datasets:
   - original
 task_categories:
   common_gen:
-  - conditional-text-generation
+  - text2text-generation
   cs_restaurants:
-  - conditional-text-generation
+  - text2text-generation
   dart:
-  - conditional-text-generation
+  - structured-to-text
   e2e_nlg:
-  - conditional-text-generation
+  - text2text-generation
   mlsum_de:
-  - conditional-text-generation
+  - text2text-generation
   mlsum_es:
-  - conditional-text-generation
+  - text2text-generation
   schema_guided_dialog:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   totto:
-  - conditional-text-generation
+  - text2text-generation
   web_nlg_en:
-  - conditional-text-generation
+  - structured-to-text
   web_nlg_ru:
-  - conditional-text-generation
+  - structured-to-text
   wiki_auto_asset_turk:
-  - conditional-text-generation
+  - text2text-generation
   wiki_lingua_es_en:
-  - conditional-text-generation
+  - text2text-generation
   wiki_lingua_ru_en:
-  - conditional-text-generation
+  - text2text-generation
   wiki_lingua_tr_en:
-  - conditional-text-generation
+  - text2text-generation
   wiki_lingua_vi_en:
-  - conditional-text-generation
+  - text2text-generation
   xsum:
-  - conditional-text-generation
+  - text2text-generation
 task_ids:
   common_gen:
-  - other-structured-to-text
+  - other-concepts-to-text
   cs_restaurants:
-  - other-structured-to-text
+  - other-intent-to-text
   dart:
-  - other-structured-to-text
+  - rdf-to-text
   e2e_nlg:
-  - other-structured-to-text
+  - text2text-generation-other-meaning-representation-to-text
   mlsum_de:
   - summarization
   mlsum_es:
@@ -264,9 +265,9 @@ task_ids:
   totto:
   - table-to-text
   web_nlg_en:
-  - other-structured-to-text
+  - rdf-to-text
   web_nlg_ru:
-  - other-structured-to-text
+  - rdf-to-text
   wiki_auto_asset_turk:
   - text-simplification
   wiki_lingua_es_en:
diff --git a/datasets/generated_reviews_enth/README.md b/datasets/generated_reviews_enth/README.md
index 629df77130a..0d05f6d7098 100644
--- a/datasets/generated_reviews_enth/README.md
+++ b/datasets/generated_reviews_enth/README.md
@@ -16,10 +16,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- translation
 - text-classification
 task_ids:
-- machine-translation
 - multi-class-classification
 - semantic-similarity-classification
 paperswithcode_id: null
diff --git a/datasets/german_legal_entity_recognition/README.md b/datasets/german_legal_entity_recognition/README.md
index 096037a525d..e57fe49f8b8 100644
--- a/datasets/german_legal_entity_recognition/README.md
+++ b/datasets/german_legal_entity_recognition/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: legal-documents-entity-recognition
diff --git a/datasets/germaner/README.md b/datasets/germaner/README.md
index 1a679fbb6e8..bb1f47b8864 100644
--- a/datasets/germaner/README.md
+++ b/datasets/germaner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/giga_fren/README.md b/datasets/giga_fren/README.md
index 8ac0c6a10cf..b77de7bf102 100644
--- a/datasets/giga_fren/README.md
+++ b/datasets/giga_fren/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: GigaFren
 ---
diff --git a/datasets/gigaword/README.md b/datasets/gigaword/README.md
index d67b30c3cab..2f97f7af60e 100644
--- a/datasets/gigaword/README.md
+++ b/datasets/gigaword/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - extended|gigaword_2003
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-headline-generation
 paperswithcode_id: null
 pretty_name: Gigaword
 ---
diff --git a/datasets/glucose/README.md b/datasets/glucose/README.md
index 30949e226b9..533798c754a 100644
--- a/datasets/glucose/README.md
+++ b/datasets/glucose/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - extended|other-ROC-stories
 task_categories:
-- sequence-modeling
-task_ids:
-- sequence-modeling-other-common-sense-inference
+- text-generation
+- fill-mask
+task_ids:
+- text-generation-other-common-sense-inference
 paperswithcode_id: glucose
 pretty_name: GLUCOSE
 ---
diff --git a/datasets/glue/README.md b/datasets/glue/README.md
index 92b54d2d2bf..5d917812a37 100644
--- a/datasets/glue/README.md
+++ b/datasets/glue/README.md
@@ -35,7 +35,7 @@ task_categories:
   sst2:
   - text-classification
   stsb:
-  - text-scoring
+  - text-classification
   wnli:
   - text-classification
 task_ids:
@@ -60,6 +60,7 @@ task_ids:
   sst2:
   - sentiment-classification
   stsb:
+  - text-scoring
   - semantic-similarity-scoring
   wnli:
   - text-classification-other-coreference-nli
diff --git a/datasets/google_wellformed_query/README.md b/datasets/google_wellformed_query/README.md
index 46e885552c8..ac4a542eee8 100644
--- a/datasets/google_wellformed_query/README.md
+++ b/datasets/google_wellformed_query/README.md
@@ -1,10 +1,10 @@
 ---
 task_categories:
-- text-scoring
+- text-classification
 multilinguality:
 - monolingual
 task_ids:
-- other
+- text-scoring
 languages:
 - en
 annotations_creators:
diff --git a/datasets/great_code/README.md b/datasets/great_code/README.md
index 95169412468..05ac0f43717 100644
--- a/datasets/great_code/README.md
+++ b/datasets/great_code/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - table-to-text
+task_ids: []
 paperswithcode_id: null
 pretty_name: GREAT
 ---
diff --git a/datasets/harem/README.md b/datasets/harem/README.md
index 07c73364048..70339486629 100644
--- a/datasets/harem/README.md
+++ b/datasets/harem/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/has_part/README.md b/datasets/has_part/README.md
index 6ec23875b4a..869e9007ca1 100644
--- a/datasets/has_part/README.md
+++ b/datasets/has_part/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - extended|other-Generics-KB
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
-- text-scoring-other-Meronym-Prediction
+- text-scoring
+- text-classification-other-Meronym-Prediction
 paperswithcode_id: haspart-kb
 pretty_name: hasPart KB
 ---
diff --git a/datasets/hate_speech_pl/README.md b/datasets/hate_speech_pl/README.md
index 2fa70687f7c..754b08a459e 100644
--- a/datasets/hate_speech_pl/README.md
+++ b/datasets/hate_speech_pl/README.md
@@ -15,8 +15,8 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - multi-class-classification
 - multi-label-classification
 - sentiment-classification
diff --git a/datasets/hausa_voa_ner/README.md b/datasets/hausa_voa_ner/README.md
index eda07ef1c13..f1e8f17499d 100644
--- a/datasets/hausa_voa_ner/README.md
+++ b/datasets/hausa_voa_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/hebrew_projectbenyehuda/README.md b/datasets/hebrew_projectbenyehuda/README.md
index e51e51f7d7b..650ab3b169f 100644
--- a/datasets/hebrew_projectbenyehuda/README.md
+++ b/datasets/hebrew_projectbenyehuda/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Hebrew Projectbenyehuda
 ---
diff --git a/datasets/hebrew_this_world/README.md b/datasets/hebrew_this_world/README.md
index 728926f6242..fb668d02363 100644
--- a/datasets/hebrew_this_world/README.md
+++ b/datasets/hebrew_this_world/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: HebrewSentiment
 ---
diff --git a/datasets/hind_encorp/README.md b/datasets/hind_encorp/README.md
index 4a01623f6a2..c90de52a7b9 100644
--- a/datasets/hind_encorp/README.md
+++ b/datasets/hind_encorp/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: hindencorp
 pretty_name: HindEnCorp
 ---
diff --git a/datasets/hindi_discourse/README.md b/datasets/hindi_discourse/README.md
index eea3a3308a8..55d9e195a13 100644
--- a/datasets/hindi_discourse/README.md
+++ b/datasets/hindi_discourse/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
-task_ids:
-- sequence-modeling-other-discourse-analysis
+- text-generation
+- fill-mask
+task_ids:
+- text-generation-other-discourse-analysis
 paperswithcode_id: null
 pretty_name: Discourse Analysis dataset
 ---
diff --git a/datasets/hippocorpus/README.md b/datasets/hippocorpus/README.md
index d33059a9cb5..1fee90765bd 100644
--- a/datasets/hippocorpus/README.md
+++ b/datasets/hippocorpus/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
-- text-scoring-other-narrative-flow
+- text-scoring
+- text-classification-other-narrative-flow
 paperswithcode_id: null
 pretty_name: hippocorpus
 ---
diff --git a/datasets/hkcancor/README.md b/datasets/hkcancor/README.md
index 7c1b177eb65..a4dec2c869b 100644
--- a/datasets/hkcancor/README.md
+++ b/datasets/hkcancor/README.md
@@ -14,11 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- translation
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
-- machine-translation
 paperswithcode_id: hong-kong-cantonese-corpus
 pretty_name: The Hong Kong Cantonese Corpus (HKCanCor)
 ---
diff --git a/datasets/hrenwac_para/README.md b/datasets/hrenwac_para/README.md
index 2a46234cf14..69f93ea9877 100644
--- a/datasets/hrenwac_para/README.md
+++ b/datasets/hrenwac_para/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: HrenwacPara
 ---
diff --git a/datasets/hrwac/README.md b/datasets/hrwac/README.md
index dc0f58ede08..81e5a4d0370 100644
--- a/datasets/hrwac/README.md
+++ b/datasets/hrwac/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: HrWac
 ---
diff --git a/datasets/humicroedit/README.md b/datasets/humicroedit/README.md
index cacb03a565d..574d5eff47d 100644
--- a/datasets/humicroedit/README.md
+++ b/datasets/humicroedit/README.md
@@ -16,12 +16,13 @@ source_datasets:
 - original
 task_categories:
   subtask-1:
-  - text-scoring
+  - text-classification
   subtask-2:
   - text-classification
 task_ids:
   subtask-1:
-  - text-scoring-other-funniness-score-prediction
+  - text-scoring
+  - text-classification-other-funniness-score-prediction
   subtask-2:
   - text-classification-other-funnier-headline-identification
 paperswithcode_id: humicroedit
diff --git a/datasets/id_liputan6/README.md b/datasets/id_liputan6/README.md
index e19b28ed60d..4e78415ee70 100644
--- a/datasets/id_liputan6/README.md
+++ b/datasets/id_liputan6/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids: []
 paperswithcode_id: null
 pretty_name: Large-scale Indonesian Summarization
 ---
diff --git a/datasets/id_nergrit_corpus/README.md b/datasets/id_nergrit_corpus/README.md
index e845eafc13b..7b1cd8b6745 100644
--- a/datasets/id_nergrit_corpus/README.md
+++ b/datasets/id_nergrit_corpus/README.md
@@ -15,7 +15,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: nergrit-corpus
diff --git a/datasets/id_newspapers_2018/README.md b/datasets/id_newspapers_2018/README.md
index 27edb0dcc59..4405b1f37ba 100644
--- a/datasets/id_newspapers_2018/README.md
+++ b/datasets/id_newspapers_2018/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Indonesian Newspapers 2018
 ---
diff --git a/datasets/id_panl_bppt/README.md b/datasets/id_panl_bppt/README.md
index 611737fa34d..15d177f26e6 100644
--- a/datasets/id_panl_bppt/README.md
+++ b/datasets/id_panl_bppt/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: IdPanlBppt
 ---
diff --git a/datasets/id_puisi/README.md b/datasets/id_puisi/README.md
index 22ac9c145f4..6b310c9f9ae 100644
--- a/datasets/id_puisi/README.md
+++ b/datasets/id_puisi/README.md
@@ -14,11 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- text2text-generation
+- text-generation
+- fill-mask
 task_ids:
-- language-modeling
-- other-structured-to-text
+- text2text-generation-other-poem-generation
 paperswithcode_id: null
 pretty_name: Indonesian Puisi
 ---
diff --git a/datasets/igbo_english_machine_translation/README.md b/datasets/igbo_english_machine_translation/README.md
index bc95c5c8dde..7c78d88091b 100644
--- a/datasets/igbo_english_machine_translation/README.md
+++ b/datasets/igbo_english_machine_translation/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: igbonlp-datasets
 pretty_name: IgboNLP Datasets
 ---
diff --git a/datasets/igbo_monolingual/README.md b/datasets/igbo_monolingual/README.md
index af1da8932c2..5a2a4e5e5a7 100644
--- a/datasets/igbo_monolingual/README.md
+++ b/datasets/igbo_monolingual/README.md
@@ -31,9 +31,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Igbo Monolingual Dataset
 ---
diff --git a/datasets/igbo_ner/README.md b/datasets/igbo_ner/README.md
index b55e9a59315..043f179ccce 100644
--- a/datasets/igbo_ner/README.md
+++ b/datasets/igbo_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/indonlu/README.md b/datasets/indonlu/README.md
index 2d3cc6cad46..2be924b384d 100644
--- a/datasets/indonlu/README.md
+++ b/datasets/indonlu/README.md
@@ -38,7 +38,7 @@ source_datasets:
 - original
 task_categories:
   bapos:
-  - structure-prediction
+  - token-classification
   casa:
   - text-classification
   emot:
@@ -48,17 +48,17 @@ task_categories:
   hoasa:
   - text-classification
   keps:
-  - structure-prediction
+  - token-classification
   nergrit:
-  - structure-prediction
+  - token-classification
   nerp:
-  - structure-prediction
+  - token-classification
   posp:
-  - structure-prediction
+  - token-classification
   smsa:
   - text-classification
   terma:
-  - structure-prediction
+  - token-classification
   wrete:
   - text-classification
 task_ids:
@@ -73,7 +73,7 @@ task_ids:
   hoasa:
   - text-classification-other-aspect-based-sentiment-analysis
   keps:
-  - structure-prediction-other-keyphrase-extraction
+  - token-classification-other-keyphrase-extraction
   nergrit:
   - named-entity-recognition
   nerp:
@@ -83,7 +83,7 @@ task_ids:
   smsa:
   - sentiment-classification
   terma:
-  - structure-prediction-other-span-extraction
+  - token-classification-other-span-extraction
   wrete:
   - semantic-similarity-classification
 paperswithcode_id: indonlu-benchmark
diff --git a/datasets/inquisitive_qg/README.md b/datasets/inquisitive_qg/README.md
index e7dea5ff940..13bc8f02534 100644
--- a/datasets/inquisitive_qg/README.md
+++ b/datasets/inquisitive_qg/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-question-generation
+- text2text-generation-other-question-generation
 paperswithcode_id: inquisitive
 ---
 
diff --git a/datasets/irc_disentangle/README.md b/datasets/irc_disentangle/README.md
index d5b528adac9..70763fefbb7 100644
--- a/datasets/irc_disentangle/README.md
+++ b/datasets/irc_disentangle/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
-- structure-prediction-other-conversation-disentanglement
+- token-classification-other-conversation-disentanglement
 paperswithcode_id: irc-disentanglement
 pretty_name: IRC Disentanglement
 ---
diff --git a/datasets/isixhosa_ner_corpus/README.md b/datasets/isixhosa_ner_corpus/README.md
index 1edb6440c1a..efbcf80cf67 100644
--- a/datasets/isixhosa_ner_corpus/README.md
+++ b/datasets/isixhosa_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/isizulu_ner_corpus/README.md b/datasets/isizulu_ner_corpus/README.md
index 95f19440626..a4c2777270f 100644
--- a/datasets/isizulu_ner_corpus/README.md
+++ b/datasets/isizulu_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/jfleg/README.md b/datasets/jfleg/README.md
index 9ed9d8d5901..2a3aa145f4c 100644
--- a/datasets/jfleg/README.md
+++ b/datasets/jfleg/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - extended|other-GUG-grammaticality-judgements
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-grammatical-error-correction
+- text2text-generation-other-grammatical-error-correction
 paperswithcode_id: jfleg
 pretty_name: JHU FLuency-Extended GUG corpus
 ---
diff --git a/datasets/jigsaw_unintended_bias/README.md b/datasets/jigsaw_unintended_bias/README.md
index a40faa0b56f..c44e5e90abd 100644
--- a/datasets/jigsaw_unintended_bias/README.md
+++ b/datasets/jigsaw_unintended_bias/README.md
@@ -15,9 +15,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
-- text-scoring-other-toxicity-prediction
+- text-scoring
+- text-classification-other-toxicity-prediction
 ---
 
 # Dataset Card for Jigsaw Unintended Bias in Toxicity Classification
diff --git a/datasets/jnlpba/README.md b/datasets/jnlpba/README.md
index ad39c68a58d..14a815be148 100644
--- a/datasets/jnlpba/README.md
+++ b/datasets/jnlpba/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended|other-genia-v3.02
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/kd_conv/README.md b/datasets/kd_conv/README.md
index 0928a0cb19e..0fadb84f6e6 100644
--- a/datasets/kd_conv/README.md
+++ b/datasets/kd_conv/README.md
@@ -15,10 +15,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
-- other-multi-turn
 paperswithcode_id: kdconv
 pretty_name: Knowledge-driven Conversation
 ---
diff --git a/datasets/kde4/README.md b/datasets/kde4/README.md
index 4acc8a71314..d8ba74a6892 100644
--- a/datasets/kde4/README.md
+++ b/datasets/kde4/README.md
@@ -105,9 +105,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: KDE4
 ---
diff --git a/datasets/kilt_tasks/README.md b/datasets/kilt_tasks/README.md
index 0c8b2090c21..797f2199378 100644
--- a/datasets/kilt_tasks/README.md
+++ b/datasets/kilt_tasks/README.md
@@ -136,7 +136,7 @@ task_categories:
   cweb:
   - text-retrieval
   eli5:
-  - question-answering
+  - text2text-generation
   - text-retrieval
   fever:
   - text-classification
@@ -148,10 +148,12 @@ task_categories:
   - question-answering
   - text-retrieval
   structured_zeroshot:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   - text-retrieval
   trex:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   - text-retrieval
   triviaqa_support_only:
   - question-answering
@@ -159,7 +161,8 @@ task_categories:
   wned:
   - text-retrieval
   wow:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   - text-retrieval
 task_ids:
   aidayago2:
@@ -171,7 +174,7 @@ task_ids:
   eli5:
   - abstractive-qa
   - document-retrieval
-  - open-domain-qa
+  - open-domain-abstractive-qa
   fever:
   - document-retrieval
   - fact-checking
diff --git a/datasets/klue/README.md b/datasets/klue/README.md
index adcad6a4e7d..7630c4ba2c6 100644
--- a/datasets/klue/README.md
+++ b/datasets/klue/README.md
@@ -18,30 +18,32 @@ task_categories:
   ynat:
   - text-classification
   sts:
-  - text-scoring
+  - text-classification
   nli:
   - text-classification
   ner:
-  - structure-prediction
+  - token-classification
   re:
-  - structure-prediction
+  - token-classification
   dp:
-  - structure-prediction
+  - token-classification
   mrc:
   - question-answering
   wos:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
 task_ids:
   ynat:
   - topic-classification
   sts:
+  - text-scoring
   - semantic-similarity-scoring
   nli:
   - natural-language-inference
   ner:
   - named-entity-recognition
   re:
-  - other-relation-extraction
+  - token-classification-other-relation-extraction
   dp:
   - parsing
   mrc:
diff --git a/datasets/kor_ner/README.md b/datasets/kor_ner/README.md
index df2487c0de0..bb4165a1a5c 100644
--- a/datasets/kor_ner/README.md
+++ b/datasets/kor_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/lama/README.md b/datasets/lama/README.md
index 80dbe66968d..e3ddb94ae7d 100755
--- a/datasets/lama/README.md
+++ b/datasets/lama/README.md
@@ -28,10 +28,11 @@ source_datasets:
 - extended|squad
 task_categories:
 - text-retrieval
-- text-scoring
+- text-classification
 task_ids:
 - fact-checking-retrieval
-- text-scoring-other-probing
+- text-classification-other-probing
+- text-scoring
 paperswithcode_id: lama
 ---
 
diff --git a/datasets/lambada/README.md b/datasets/lambada/README.md
index e711a53ace2..cb1f0d9cc07 100644
--- a/datasets/lambada/README.md
+++ b/datasets/lambada/README.md
@@ -1,8 +1,8 @@
 ---
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-long-range-dependency
+- text2text-generation-other-long-range-dependency
 multilinguality:
 - monolingual
 languages:
diff --git a/datasets/lener_br/README.md b/datasets/lener_br/README.md
index 5e3c8fb185f..72747df8916 100644
--- a/datasets/lener_br/README.md
+++ b/datasets/lener_br/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: lener-br
diff --git a/datasets/librispeech_asr/README.md b/datasets/librispeech_asr/README.md
index a530435216f..329ecfb246b 100644
--- a/datasets/librispeech_asr/README.md
+++ b/datasets/librispeech_asr/README.md
@@ -17,9 +17,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for librispeech_asr
diff --git a/datasets/limit/README.md b/datasets/limit/README.md
index 5106460c29b..61671e79ef2 100644
--- a/datasets/limit/README.md
+++ b/datasets/limit/README.md
@@ -15,7 +15,7 @@ source_datasets:
 - extended|net-activities-captions
 - original
 task_categories:
-- structure-prediction
+- token-classification
 - text-classification
 task_ids:
 - multi-class-classification
diff --git a/datasets/linnaeus/README.md b/datasets/linnaeus/README.md
index 0acd6d6090f..95ea019ebc1 100644
--- a/datasets/linnaeus/README.md
+++ b/datasets/linnaeus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: linnaeus
diff --git a/datasets/lj_speech/README.md b/datasets/lj_speech/README.md
index 0a31deebf18..ef8f4d111ff 100644
--- a/datasets/lj_speech/README.md
+++ b/datasets/lj_speech/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for lj_speech
diff --git a/datasets/lst20/README.md b/datasets/lst20/README.md
index 859a05c6834..77117a80d77 100644
--- a/datasets/lst20/README.md
+++ b/datasets/lst20/README.md
@@ -14,13 +14,13 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
-- structure-prediction-other-clause-segmentation
-- structure-prediction-other-sentence-segmentation
-- structure-prediction-other-word-segmentation
+- token-classification-other-clause-segmentation
+- token-classification-other-sentence-segmentation
+- token-classification-other-word-segmentation
 paperswithcode_id: null
 pretty_name: LST20
 ---
diff --git a/datasets/m_lama/README.md b/datasets/m_lama/README.md
index cb129051e09..a17141a3dfb 100644
--- a/datasets/m_lama/README.md
+++ b/datasets/m_lama/README.md
@@ -71,10 +71,11 @@ source_datasets:
 - extended|lama
 task_categories:
 - question-answering
-- text-scoring
+- text-classification
 task_ids:
 - open-domain-qa
-- text-scoring-other-probing
+- text-scoring
+- text-classification-other-probing
 paperswithcode_id: null
 pretty_name: MLama
 ---
diff --git a/datasets/mac_morpho/README.md b/datasets/mac_morpho/README.md
index 0bc9741311e..d61de28a62e 100644
--- a/datasets/mac_morpho/README.md
+++ b/datasets/mac_morpho/README.md
@@ -15,7 +15,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - part-of-speech-tagging
 paperswithcode_id: null
diff --git a/datasets/makhzan/README.md b/datasets/makhzan/README.md
index b2bea6518b8..bbafac9bd7c 100644
--- a/datasets/makhzan/README.md
+++ b/datasets/makhzan/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: makhzan
 ---
diff --git a/datasets/masakhaner/README.md b/datasets/masakhaner/README.md
index f00f3007b2d..b3fbcde5a9d 100644
--- a/datasets/masakhaner/README.md
+++ b/datasets/masakhaner/README.md
@@ -34,7 +34,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/mbpp/README.md b/datasets/mbpp/README.md
index 6bc9f0d491e..9c5fae251a0 100644
--- a/datasets/mbpp/README.md
+++ b/datasets/mbpp/README.md
@@ -17,9 +17,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-code-generation
+- text2text-generation-other-code-generation
 ---
 
 # Dataset Card for Mostly Basic Python Problems (mbpp)
diff --git a/datasets/mc4/README.md b/datasets/mc4/README.md
index 4b49dc73162..277ef1a2950 100644
--- a/datasets/mc4/README.md
+++ b/datasets/mc4/README.md
@@ -130,9 +130,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: mc4
 ---
 
diff --git a/datasets/mdd/README.md b/datasets/mdd/README.md
index 2def0f91319..49e49326587 100644
--- a/datasets/mdd/README.md
+++ b/datasets/mdd/README.md
@@ -21,7 +21,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: mdd
diff --git a/datasets/menyo20k_mt/README.md b/datasets/menyo20k_mt/README.md
index 0e92d643cd6..2f62c97e241 100644
--- a/datasets/menyo20k_mt/README.md
+++ b/datasets/menyo20k_mt/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: MENYO-20k
 ---
diff --git a/datasets/meta_woz/README.md b/datasets/meta_woz/README.md
index efdc55e1f2f..8b31104bea4 100644
--- a/datasets/meta_woz/README.md
+++ b/datasets/meta_woz/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: metalwoz
diff --git a/datasets/miam/README.md b/datasets/miam/README.md
index 9e25845dcfd..20decb3583e 100644
--- a/datasets/miam/README.md
+++ b/datasets/miam/README.md
@@ -23,28 +23,34 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
 task_ids:
   dihana:
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   ilisten:
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   loria:
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   maptask:
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   vm2:
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
 paperswithcode_id: null
 pretty_name: MIAM
diff --git a/datasets/mkb/README.md b/datasets/mkb/README.md
index feb90149112..03f6f8a7be1 100644
--- a/datasets/mkb/README.md
+++ b/datasets/mkb/README.md
@@ -1,10 +1,12 @@
 ---
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 multilinguality:
 - translation
 task_ids:
 - language-modeling
+- masked-language-modeling
 languages:
 - hi
 - te
diff --git a/datasets/mlsum/README.md b/datasets/mlsum/README.md
index 0f21319c0b8..cb7df888182 100644
--- a/datasets/mlsum/README.md
+++ b/datasets/mlsum/README.md
@@ -28,10 +28,9 @@ source_datasets:
 - extended|cnn_dailymail
 - original
 task_categories:
-- conditional-text-generation
+- translation
 - text-classification
 task_ids:
-- machine-translation
 - multi-class-classification
 - multi-label-classification
 - summarization
diff --git a/datasets/ms_terms/README.md b/datasets/ms_terms/README.md
index eae98037dcb..ae293e4faab 100644
--- a/datasets/ms_terms/README.md
+++ b/datasets/ms_terms/README.md
@@ -129,9 +129,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: MsTerms
 ---
diff --git a/datasets/msr_text_compression/README.md b/datasets/msr_text_compression/README.md
index 6a038a34f70..15d9ba75772 100644
--- a/datasets/msr_text_compression/README.md
+++ b/datasets/msr_text_compression/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - extended|other-Open-American-National-Corpus-(OANC1)
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids: []
 pretty_name: MsrTextCompression
 ---
 
diff --git a/datasets/msr_zhen_translation_parity/README.md b/datasets/msr_zhen_translation_parity/README.md
index 14c1cdcc95a..a35d641ed57 100644
--- a/datasets/msr_zhen_translation_parity/README.md
+++ b/datasets/msr_zhen_translation_parity/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - extended|other-newstest2017
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: MsrZhenTranslationParity
 ---
diff --git a/datasets/msra_ner/README.md b/datasets/msra_ner/README.md
index 3bc4562c5ef..d4f528bf7ad 100644
--- a/datasets/msra_ner/README.md
+++ b/datasets/msra_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/mt_eng_vietnamese/README.md b/datasets/mt_eng_vietnamese/README.md
index dd82fc579d4..3ccffae9e9b 100644
--- a/datasets/mt_eng_vietnamese/README.md
+++ b/datasets/mt_eng_vietnamese/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: MtEngVietnamese
 ---
diff --git a/datasets/multi_news/README.md b/datasets/multi_news/README.md
index 3f395f4183e..525ee1cf31c 100644
--- a/datasets/multi_news/README.md
+++ b/datasets/multi_news/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 paperswithcode_id: multi-news
 ---
 
diff --git a/datasets/multi_nli/README.md b/datasets/multi_nli/README.md
index 3f63c7ab3be..c9805f41f8d 100644
--- a/datasets/multi_nli/README.md
+++ b/datasets/multi_nli/README.md
@@ -18,8 +18,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: multinli
 pretty_name: Multi-Genre Natural Language Inference
diff --git a/datasets/multi_nli_mismatch/README.md b/datasets/multi_nli_mismatch/README.md
index 7bfa78b724f..26c59b59431 100644
--- a/datasets/multi_nli_mismatch/README.md
+++ b/datasets/multi_nli_mismatch/README.md
@@ -18,8 +18,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: multinli
 pretty_name: Multi-Genre Natural Language Inference
diff --git a/datasets/multi_para_crawl/README.md b/datasets/multi_para_crawl/README.md
index 48776c9d5ae..651781570ca 100644
--- a/datasets/multi_para_crawl/README.md
+++ b/datasets/multi_para_crawl/README.md
@@ -53,9 +53,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: MultiParaCrawl
 ---
diff --git a/datasets/multi_woz_v22/README.md b/datasets/multi_woz_v22/README.md
index ff21ee841bd..c413546efeb 100644
--- a/datasets/multi_woz_v22/README.md
+++ b/datasets/multi_woz_v22/README.md
@@ -15,8 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
-- structure-prediction
+- text-generation
+- fill-mask
+- token-classification
 - text-classification
 task_ids:
 - dialogue-modeling
diff --git a/datasets/multi_x_science_sum/README.md b/datasets/multi_x_science_sum/README.md
index 2d9bb3440ea..5e9489db0f2 100644
--- a/datasets/multi_x_science_sum/README.md
+++ b/datasets/multi_x_science_sum/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-paper-abstract-generation
 paperswithcode_id: multi-xscience
 pretty_name: Multi-XScience
 ---
@@ -54,7 +54,7 @@ pretty_name: Multi-XScience
 
 ### Dataset Summary
 
-Multi-XScience, a large-scale multi-document summarization dataset created from scientific articles. Multi-XScience introduces a challenging multi-document summarization task: writing therelated-work section of a paper based on itsabstract and the articles it references.
+Multi-XScience, a large-scale multi-document summarization dataset created from scientific articles. Multi-XScience introduces a challenging multi-document summarization task: writing the related-work section of a paper based on its abstract and the articles it references.
 
 ### Supported Tasks and Leaderboards
 
diff --git a/datasets/multilingual_librispeech/README.md b/datasets/multilingual_librispeech/README.md
index 68a92b13152..5d390f3f25f 100644
--- a/datasets/multilingual_librispeech/README.md
+++ b/datasets/multilingual_librispeech/README.md
@@ -23,9 +23,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for MultiLingual LibriSpeech
diff --git a/datasets/mutual_friends/README.md b/datasets/mutual_friends/README.md
index c53632cec22..4578b9d169d 100644
--- a/datasets/mutual_friends/README.md
+++ b/datasets/mutual_friends/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: mutualfriends
diff --git a/datasets/narrativeqa/README.md b/datasets/narrativeqa/README.md
index 29f8c9b4ae0..536ca4bd483 100644
--- a/datasets/narrativeqa/README.md
+++ b/datasets/narrativeqa/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
 paperswithcode_id: narrativeqa
diff --git a/datasets/narrativeqa_manual/README.md b/datasets/narrativeqa_manual/README.md
index ab06c73d197..e852781e38f 100644
--- a/datasets/narrativeqa_manual/README.md
+++ b/datasets/narrativeqa_manual/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
 paperswithcode_id: narrativeqa
diff --git a/datasets/ncbi_disease/README.md b/datasets/ncbi_disease/README.md
index b91da3114eb..73fc77d6058 100644
--- a/datasets/ncbi_disease/README.md
+++ b/datasets/ncbi_disease/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: ncbi-disease-1
diff --git a/datasets/nchlt/README.md b/datasets/nchlt/README.md
index 6e930144686..aef3ecafec7 100644
--- a/datasets/nchlt/README.md
+++ b/datasets/nchlt/README.md
@@ -22,7 +22,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/ncslgr/README.md b/datasets/ncslgr/README.md
index 02af89f315a..ad29336f12b 100644
--- a/datasets/ncslgr/README.md
+++ b/datasets/ncslgr/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: NCSLGR
 ---
diff --git a/datasets/nell/README.md b/datasets/nell/README.md
index 961e5370f81..e04dce6a32e 100755
--- a/datasets/nell/README.md
+++ b/datasets/nell/README.md
@@ -21,12 +21,13 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text-to-tabular
 - text-retrieval
+- text-to-structured
 task_ids:
 - entity-linking-retrieval
 - fact-checking-retrieval
-- other-structured-to-text
+- relation-extraction
 paperswithcode_id: nell
 pretty_name: Never Ending Language Learning (NELL)
 ---
diff --git a/datasets/news_commentary/README.md b/datasets/news_commentary/README.md
index b36b94bc08e..671e4827266 100644
--- a/datasets/news_commentary/README.md
+++ b/datasets/news_commentary/README.md
@@ -25,9 +25,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: NewsCommentary
 ---
diff --git a/datasets/newsph/README.md b/datasets/newsph/README.md
index 737bc7978e9..c23467d033f 100644
--- a/datasets/newsph/README.md
+++ b/datasets/newsph/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: newsph-nli
 pretty_name: NewsPH-NLI
 ---
diff --git a/datasets/newspop/README.md b/datasets/newspop/README.md
index a5c96d72b1e..52f7022fd6b 100644
--- a/datasets/newspop/README.md
+++ b/datasets/newspop/README.md
@@ -14,9 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
-- other-social-media-shares-prediction
+- text-scoring
+- text-classification-other-social-media-shares-prediction
 paperswithcode_id: null
 pretty_name: News Popularity in Multiple Social Media Platforms
 ---
diff --git a/datasets/newsroom/README.md b/datasets/newsroom/README.md
index 6c10bb6a926..3aeec719e2e 100644
--- a/datasets/newsroom/README.md
+++ b/datasets/newsroom/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 paperswithcode_id: newsroom
 ---
 
diff --git a/datasets/nkjp-ner/README.md b/datasets/nkjp-ner/README.md
index 19f75e0c95f..5736c045f45 100644
--- a/datasets/nkjp-ner/README.md
+++ b/datasets/nkjp-ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/norec/README.md b/datasets/norec/README.md
index e742a54ec26..8564fa2c8c2 100644
--- a/datasets/norec/README.md
+++ b/datasets/norec/README.md
@@ -17,7 +17,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: norec
diff --git a/datasets/norne/README.md b/datasets/norne/README.md
index 7044b742135..d68d4da304b 100644
--- a/datasets/norne/README.md
+++ b/datasets/norne/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/norwegian_ner/README.md b/datasets/norwegian_ner/README.md
index e8db3942423..8e8696f6f76 100644
--- a/datasets/norwegian_ner/README.md
+++ b/datasets/norwegian_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/numer_sense/README.md b/datasets/numer_sense/README.md
index 95b1c583ac2..e711ca69484 100644
--- a/datasets/numer_sense/README.md
+++ b/datasets/numer_sense/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - extended|other
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - slot-filling
 paperswithcode_id: numersense
diff --git a/datasets/numeric_fused_head/README.md b/datasets/numeric_fused_head/README.md
index 7d0e650d4a3..bce963793bb 100644
--- a/datasets/numeric_fused_head/README.md
+++ b/datasets/numeric_fused_head/README.md
@@ -21,9 +21,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
-- structure-prediction-other-fused-head-identification
+- token-classification-other-fused-head-identification
 paperswithcode_id: numeric-fused-head
 pretty_name: Numeric Fused Heads
 ---
diff --git a/datasets/oclar/README.md b/datasets/oclar/README.md
index da5d51da6aa..864b8a07d3c 100644
--- a/datasets/oclar/README.md
+++ b/datasets/oclar/README.md
@@ -15,8 +15,8 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - sentiment-classification
 - sentiment-scoring
 paperswithcode_id: null
diff --git a/datasets/ofis_publik/README.md b/datasets/ofis_publik/README.md
index 1b3553f3ae5..b83e8edc68b 100644
--- a/datasets/ofis_publik/README.md
+++ b/datasets/ofis_publik/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OfisPublik
 ---
diff --git a/datasets/ollie/README.md b/datasets/ollie/README.md
index 4148f63ac82..da4bf65682d 100755
--- a/datasets/ollie/README.md
+++ b/datasets/ollie/README.md
@@ -17,10 +17,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- other
+- text-to-structured
 task_ids:
-- other-structured-to-text
-- other-other-relation-extraction
+- relation-extraction
 paperswithcode_id: null
 pretty_name: Ollie
 ---
diff --git a/datasets/onestop_english/README.md b/datasets/onestop_english/README.md
index 2ac162080ec..58cff19ac65 100644
--- a/datasets/onestop_english/README.md
+++ b/datasets/onestop_english/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 - text-classification
 task_ids:
 - multi-class-classification
diff --git a/datasets/open_subtitles/README.md b/datasets/open_subtitles/README.md
index e0598ec5704..e5ebf915b32 100644
--- a/datasets/open_subtitles/README.md
+++ b/datasets/open_subtitles/README.md
@@ -84,9 +84,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: opensubtitles
 pretty_name: OpenSubtitles
 ---
diff --git a/datasets/openai_humaneval/README.md b/datasets/openai_humaneval/README.md
index 0d3c0f71121..efee435558d 100644
--- a/datasets/openai_humaneval/README.md
+++ b/datasets/openai_humaneval/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-code-generation
+- text2text-generation-other-code-generation
 ---
 
 # Dataset Card for OpenAI HumanEval
diff --git a/datasets/openslr/README.md b/datasets/openslr/README.md
index ddf14cbd482..72497795d54 100644
--- a/datasets/openslr/README.md
+++ b/datasets/openslr/README.md
@@ -74,9 +74,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 paperswithcode_id: null
 ---
 
diff --git a/datasets/openwebtext/README.md b/datasets/openwebtext/README.md
index 3adc80d644e..dae418a99c9 100644
--- a/datasets/openwebtext/README.md
+++ b/datasets/openwebtext/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: openwebtext
 ---
 
diff --git a/datasets/opus100/README.md b/datasets/opus100/README.md
index 0f7b82b2c5c..19e6a45e556 100644
--- a/datasets/opus100/README.md
+++ b/datasets/opus100/README.md
@@ -1,11 +1,13 @@
 ---
 pretty_name: Opus100
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 multilinguality:
 - translation
 task_ids:
 - language-modeling
+- masked-language-modeling
 languages:
   af-en:
   - af
diff --git a/datasets/opus_books/README.md b/datasets/opus_books/README.md
index 7d0cf334c25..65974ff607a 100644
--- a/datasets/opus_books/README.md
+++ b/datasets/opus_books/README.md
@@ -29,9 +29,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusBooks
 ---
diff --git a/datasets/opus_dgt/README.md b/datasets/opus_dgt/README.md
index 073a763e1cc..db243a58ea4 100644
--- a/datasets/opus_dgt/README.md
+++ b/datasets/opus_dgt/README.md
@@ -57,9 +57,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusDgt
 ---
diff --git a/datasets/opus_dogc/README.md b/datasets/opus_dogc/README.md
index 79b7be2d487..4912c132fa3 100644
--- a/datasets/opus_dogc/README.md
+++ b/datasets/opus_dogc/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OPUS DOGC
 ---
diff --git a/datasets/opus_elhuyar/README.md b/datasets/opus_elhuyar/README.md
index 5f43b2a0459..3844e25c0f8 100644
--- a/datasets/opus_elhuyar/README.md
+++ b/datasets/opus_elhuyar/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusElhuyar
 ---
diff --git a/datasets/opus_euconst/README.md b/datasets/opus_euconst/README.md
index 2a39dbc256c..84a0c9c6685 100644
--- a/datasets/opus_euconst/README.md
+++ b/datasets/opus_euconst/README.md
@@ -34,9 +34,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusEuconst
 ---
diff --git a/datasets/opus_finlex/README.md b/datasets/opus_finlex/README.md
index 91197b4de6f..762fc2c941c 100644
--- a/datasets/opus_finlex/README.md
+++ b/datasets/opus_finlex/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusFinlex
 ---
diff --git a/datasets/opus_fiskmo/README.md b/datasets/opus_fiskmo/README.md
index 4c1f018727d..f8965de36ee 100644
--- a/datasets/opus_fiskmo/README.md
+++ b/datasets/opus_fiskmo/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusFiskmo
 ---
diff --git a/datasets/opus_gnome/README.md b/datasets/opus_gnome/README.md
index d49c860cf5c..7e0a719d023 100644
--- a/datasets/opus_gnome/README.md
+++ b/datasets/opus_gnome/README.md
@@ -219,9 +219,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusGnome
 ---
diff --git a/datasets/opus_infopankki/README.md b/datasets/opus_infopankki/README.md
index 96f81db3a67..bde5a890778 100644
--- a/datasets/opus_infopankki/README.md
+++ b/datasets/opus_infopankki/README.md
@@ -211,9 +211,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusInfopankki
 ---
diff --git a/datasets/opus_memat/README.md b/datasets/opus_memat/README.md
index a55f70caccf..cb3dbeb0f53 100644
--- a/datasets/opus_memat/README.md
+++ b/datasets/opus_memat/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusMemat
 ---
diff --git a/datasets/opus_montenegrinsubs/README.md b/datasets/opus_montenegrinsubs/README.md
index 57776cb3141..e791b100778 100644
--- a/datasets/opus_montenegrinsubs/README.md
+++ b/datasets/opus_montenegrinsubs/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusMontenegrinsubs
 ---
diff --git a/datasets/opus_openoffice/README.md b/datasets/opus_openoffice/README.md
index 3ac2107c68a..5fa918863d9 100644
--- a/datasets/opus_openoffice/README.md
+++ b/datasets/opus_openoffice/README.md
@@ -97,9 +97,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusOpenoffice
 ---
diff --git a/datasets/opus_paracrawl/README.md b/datasets/opus_paracrawl/README.md
index 804c14bddfd..90367bb96ec 100644
--- a/datasets/opus_paracrawl/README.md
+++ b/datasets/opus_paracrawl/README.md
@@ -72,9 +72,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusParaCrawl
 ---
diff --git a/datasets/opus_rf/README.md b/datasets/opus_rf/README.md
index 74f5216801b..25b08f3ac9c 100644
--- a/datasets/opus_rf/README.md
+++ b/datasets/opus_rf/README.md
@@ -43,9 +43,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusRf
 ---
diff --git a/datasets/opus_tedtalks/README.md b/datasets/opus_tedtalks/README.md
index 5dc39418afd..061d96d44ed 100644
--- a/datasets/opus_tedtalks/README.md
+++ b/datasets/opus_tedtalks/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusTedtalks
 ---
diff --git a/datasets/opus_ubuntu/README.md b/datasets/opus_ubuntu/README.md
index 83ad32844b7..709e2ff295d 100644
--- a/datasets/opus_ubuntu/README.md
+++ b/datasets/opus_ubuntu/README.md
@@ -276,9 +276,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusUbuntu
 ---
diff --git a/datasets/opus_wikipedia/README.md b/datasets/opus_wikipedia/README.md
index e4b84456bab..9af77016bff 100644
--- a/datasets/opus_wikipedia/README.md
+++ b/datasets/opus_wikipedia/README.md
@@ -42,9 +42,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusWikipedia
 ---
diff --git a/datasets/opus_xhosanavy/README.md b/datasets/opus_xhosanavy/README.md
index 83451399699..67ae43c7e0a 100644
--- a/datasets/opus_xhosanavy/README.md
+++ b/datasets/opus_xhosanavy/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: OpusXhosanavy
 ---
diff --git a/datasets/orange_sum/README.md b/datasets/orange_sum/README.md
index e5577d0face..53a3f20e0aa 100644
--- a/datasets/orange_sum/README.md
+++ b/datasets/orange_sum/README.md
@@ -15,9 +15,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-headline-generation
+- news-articles-summarization
 paperswithcode_id: orangesum
 ---
 
diff --git a/datasets/oscar/README.md b/datasets/oscar/README.md
index 7cf2d23e61c..f2ac235ab29 100644
--- a/datasets/oscar/README.md
+++ b/datasets/oscar/README.md
@@ -843,9 +843,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: oscar
 ---
 
diff --git a/datasets/para_crawl/README.md b/datasets/para_crawl/README.md
index 984c767476b..b64f26e7c0e 100644
--- a/datasets/para_crawl/README.md
+++ b/datasets/para_crawl/README.md
@@ -38,9 +38,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: paracrawl
 ---
 
diff --git a/datasets/para_pat/README.md b/datasets/para_pat/README.md
index efe9d01410d..b7eaa345aeb 100644
--- a/datasets/para_pat/README.md
+++ b/datasets/para_pat/README.md
@@ -29,9 +29,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: parapat
 pretty_name: Parallel Corpus of Patents Abstracts
 ---
diff --git a/datasets/paws-x/README.md b/datasets/paws-x/README.md
index 0ec7906d50a..7874458e63a 100644
--- a/datasets/paws-x/README.md
+++ b/datasets/paws-x/README.md
@@ -24,11 +24,11 @@ source_datasets:
 - extended|other-paws
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
 - semantic-similarity-classification
 - semantic-similarity-scoring
-- text-scoring-other-paraphrase-identification
+- text-classification-other-paraphrase-identification
+- text-scoring
 paperswithcode_id: paws-x
 ---
 
diff --git a/datasets/paws/README.md b/datasets/paws/README.md
index 891532f525e..154df26e53d 100644
--- a/datasets/paws/README.md
+++ b/datasets/paws/README.md
@@ -26,11 +26,11 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
 - semantic-similarity-classification
 - semantic-similarity-scoring
-- text-scoring-other-paraphrase-identification
+- text-classification-other-paraphrase-identification
+- text-scoring
 paperswithcode_id: paws
 ---
 
diff --git a/datasets/pec/README.md b/datasets/pec/README.md
index 305ebbf7552..596985f8b99 100644
--- a/datasets/pec/README.md
+++ b/datasets/pec/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-retrieval
 task_ids:
   all:
diff --git a/datasets/peoples_daily_ner/README.md b/datasets/peoples_daily_ner/README.md
index 6583098bf91..43a503cc8e8 100644
--- a/datasets/peoples_daily_ner/README.md
+++ b/datasets/peoples_daily_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/persian_ner/README.md b/datasets/persian_ner/README.md
index 5e10dff7e9c..f2547f21009 100644
--- a/datasets/persian_ner/README.md
+++ b/datasets/persian_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 pretty_name: Persian NER
diff --git a/datasets/php/README.md b/datasets/php/README.md
index 15321204ade..6569f1af419 100644
--- a/datasets/php/README.md
+++ b/datasets/php/README.md
@@ -36,9 +36,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: php
 ---
diff --git a/datasets/pib/README.md b/datasets/pib/README.md
index 1a4540a4f2b..cf2fb970aca 100644
--- a/datasets/pib/README.md
+++ b/datasets/pib/README.md
@@ -1,10 +1,11 @@
 ---
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- translation
+- text-generation
+- fill-mask
 task_ids:
-- machine-translation
 - language-modeling
+- masked-language-modeling
 multilinguality:
 - translation
 languages:
diff --git a/datasets/pn_summary/README.md b/datasets/pn_summary/README.md
index c1ac026877e..e7779021deb 100644
--- a/datasets/pn_summary/README.md
+++ b/datasets/pn_summary/README.md
@@ -14,10 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- summarization
 - text-classification
 task_ids:
-- summarization
+- news-articles-summarization
+- news-articles-headline-generation
 - text-simplification
 - topic-classification
 paperswithcode_id: pn-summary
diff --git a/datasets/poleval2019_mt/README.md b/datasets/poleval2019_mt/README.md
index 868f2dab718..2d213037e66 100644
--- a/datasets/poleval2019_mt/README.md
+++ b/datasets/poleval2019_mt/README.md
@@ -17,9 +17,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: Poleval2019Mt
 ---
diff --git a/datasets/polsum/README.md b/datasets/polsum/README.md
index 6a48848cb26..68e004898d0 100644
--- a/datasets/polsum/README.md
+++ b/datasets/polsum/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 paperswithcode_id: null
 pretty_name: Polish Summaries Corpus
 ---
diff --git a/datasets/polyglot_ner/README.md b/datasets/polyglot_ner/README.md
index c96c5d6398e..e4025775475 100644
--- a/datasets/polyglot_ner/README.md
+++ b/datasets/polyglot_ner/README.md
@@ -54,7 +54,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: polyglot-ner
diff --git a/datasets/psc/README.md b/datasets/psc/README.md
index 0a07be50547..eb075e68fac 100644
--- a/datasets/psc/README.md
+++ b/datasets/psc/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 paperswithcode_id: null
 pretty_name: psc
 ---
diff --git a/datasets/ptb_text_only/README.md b/datasets/ptb_text_only/README.md
index 7955a72b6da..397778ca1d9 100644
--- a/datasets/ptb_text_only/README.md
+++ b/datasets/ptb_text_only/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Penn Treebank
 ---
diff --git a/datasets/pubmed/README.md b/datasets/pubmed/README.md
index 86bd4fed8b5..2a4c905d64a 100644
--- a/datasets/pubmed/README.md
+++ b/datasets/pubmed/README.md
@@ -14,14 +14,14 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
-- text-scoring
 task_ids:
 - language-modeling
-- other-structured-to-text
-- text-scoring-other-citation-estimation
+- masked-language-modeling
+- text-classification-other-citation-estimation
+- text-scoring
 - topic-classification
 paperswithcode_id: pubmed
 pretty_name: PubMed
diff --git a/datasets/py_ast/README.md b/datasets/py_ast/README.md
index 68edd57de56..0f2465bc26e 100644
--- a/datasets/py_ast/README.md
+++ b/datasets/py_ast/README.md
@@ -16,9 +16,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
-- sequence-modeling-other-code-modeling
+- text-generation-other-code-modeling
 paperswithcode_id: null
 ---
 # Dataset Card for [py_ast]
diff --git a/datasets/qed_amara/README.md b/datasets/qed_amara/README.md
index a78ed3cb49b..97c27223977 100644
--- a/datasets/qed_amara/README.md
+++ b/datasets/qed_amara/README.md
@@ -238,9 +238,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: QedAmara
 ---
diff --git a/datasets/quac/README.md b/datasets/quac/README.md
index e5e757a7c63..0f222943578 100644
--- a/datasets/quac/README.md
+++ b/datasets/quac/README.md
@@ -16,7 +16,8 @@ source_datasets:
 - extended|wikipedia
 task_categories:
 - question-answering
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 - extractive-qa
diff --git a/datasets/recipe_nlg/README.md b/datasets/recipe_nlg/README.md
index 3e58eadd8f2..db3c68ea67b 100644
--- a/datasets/recipe_nlg/README.md
+++ b/datasets/recipe_nlg/README.md
@@ -14,14 +14,16 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- text2text-generation
+- text-generation
+- fill-mask
 - text-retrieval
 task_ids:
 - document-retrieval
 - entity-linking-retrieval
 - explanation-generation
 - language-modeling
+- masked-language-modeling
 - summarization
 paperswithcode_id: recipenlg
 pretty_name: RecipeNLG
diff --git a/datasets/reddit/README.md b/datasets/reddit/README.md
index 4b2f97ad18d..b35bedf3d13 100644
--- a/datasets/reddit/README.md
+++ b/datasets/reddit/README.md
@@ -16,9 +16,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-reddit-posts-summarization
 ---
 
 # Dataset Card for Reddit Webis-TLDR-17
diff --git a/datasets/reddit_tifu/README.md b/datasets/reddit_tifu/README.md
index fbf9b0d9783..f58c3667dc0 100644
--- a/datasets/reddit_tifu/README.md
+++ b/datasets/reddit_tifu/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-reddit-posts-summarization
 paperswithcode_id: reddit-tifu
 ---
 
@@ -60,7 +60,7 @@ paperswithcode_id: reddit-tifu
 ### Dataset Summary
 
 Reddit dataset, where TIFU denotes the name of subbreddit /r/tifu.
-As defined in the publication, styel "short" uses title as summary and
+As defined in the publication, style "short" uses title as summary and
 "long" uses tldr as summary.
 
 Features includes:
diff --git a/datasets/refresd/README.md b/datasets/refresd/README.md
index 909f0d9b9f9..4a415d2e794 100644
--- a/datasets/refresd/README.md
+++ b/datasets/refresd/README.md
@@ -17,10 +17,10 @@ size_categories:
 source_datasets: []
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
 - semantic-similarity-classification
 - semantic-similarity-scoring
+- text-scoring
 paperswithcode_id: refresd
 pretty_name: Rationalized English-French Semantic Divergences
 ---
diff --git a/datasets/ro_sts/README.md b/datasets/ro_sts/README.md
index 8a8007b22c4..c3f6447c8a0 100644
--- a/datasets/ro_sts/README.md
+++ b/datasets/ro_sts/README.md
@@ -13,8 +13,9 @@ size_categories:
 source_datasets:
 - extended|other-sts-b
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: null
 pretty_name: RO-STS
diff --git a/datasets/ro_sts_parallel/README.md b/datasets/ro_sts_parallel/README.md
index 4589e07e31e..f9d070df1e4 100755
--- a/datasets/ro_sts_parallel/README.md
+++ b/datasets/ro_sts_parallel/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - extended|other-sts-b
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: RO-STS-Parallel
 ---
diff --git a/datasets/ronec/README.md b/datasets/ronec/README.md
index d29ce13bea4..9b0614f5005 100644
--- a/datasets/ronec/README.md
+++ b/datasets/ronec/README.md
@@ -15,7 +15,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: ronec
diff --git a/datasets/s2orc/README.md b/datasets/s2orc/README.md
index 0343bd9c5e2..7523f7d5f75 100644
--- a/datasets/s2orc/README.md
+++ b/datasets/s2orc/README.md
@@ -15,10 +15,12 @@ source_datasets:
 - original
 task_categories:
 - other
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
 task_ids:
 - language-modeling
+- masked-language-modeling
 - multi-class-classification
 - multi-label-classification
 - other-other-citation-recommendation
diff --git a/datasets/samsum/README.md b/datasets/samsum/README.md
index ea114633db8..2e90f0b8285 100644
--- a/datasets/samsum/README.md
+++ b/datasets/samsum/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-conversations-summarization
 paperswithcode_id: samsum-corpus
 pretty_name: SAMSum Corpus
 ---
diff --git a/datasets/sanskrit_classic/README.md b/datasets/sanskrit_classic/README.md
index 0dad96d49c7..16e4accba50 100644
--- a/datasets/sanskrit_classic/README.md
+++ b/datasets/sanskrit_classic/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: SanskritClassic
 ---
diff --git a/datasets/saudinewsnet/README.md b/datasets/saudinewsnet/README.md
index 37c8b09dd5d..fe5981abdaa 100644
--- a/datasets/saudinewsnet/README.md
+++ b/datasets/saudinewsnet/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: saudinewsnet
 ---
diff --git a/datasets/scb_mt_enth_2020/README.md b/datasets/scb_mt_enth_2020/README.md
index d8cd272e76f..f935bf0debd 100644
--- a/datasets/scb_mt_enth_2020/README.md
+++ b/datasets/scb_mt_enth_2020/README.md
@@ -20,9 +20,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: scb-mt-en-th-2020
 pretty_name: ScbMtEnth2020
 ---
diff --git a/datasets/schema_guided_dstc8/README.md b/datasets/schema_guided_dstc8/README.md
index 3e7d5e61ead..e9368fa4da7 100644
--- a/datasets/schema_guided_dstc8/README.md
+++ b/datasets/schema_guided_dstc8/README.md
@@ -15,8 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
-- structure-prediction
+- text-generation
+- fill-mask
+- token-classification
 - text-classification
 task_ids:
 - dialogue-modeling
diff --git a/datasets/scielo/README.md b/datasets/scielo/README.md
index 4afe0c5e917..d9bda3ebc69 100644
--- a/datasets/scielo/README.md
+++ b/datasets/scielo/README.md
@@ -23,9 +23,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: SciELO
 ---
diff --git a/datasets/scitldr/README.md b/datasets/scitldr/README.md
index 732cf5d0be8..b081cdb08f8 100644
--- a/datasets/scitldr/README.md
+++ b/datasets/scitldr/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-scientific-documents-summarization
 paperswithcode_id: scitldr
 pretty_name: SciTLDR
 ---
diff --git a/datasets/sede/README.md b/datasets/sede/README.md
index 5daac69ee37..212fcc92158 100644
--- a/datasets/sede/README.md
+++ b/datasets/sede/README.md
@@ -16,7 +16,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - parsing
 ---
diff --git a/datasets/sem_eval_2014_task_1/README.md b/datasets/sem_eval_2014_task_1/README.md
index e1a90cd1c16..7bce74dacdc 100644
--- a/datasets/sem_eval_2014_task_1/README.md
+++ b/datasets/sem_eval_2014_task_1/README.md
@@ -15,8 +15,8 @@ source_datasets:
 - extended|other-ImageFlickr and SemEval-2012 STS MSR-Video Descriptions
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - natural-language-inference
 - semantic-similarity-scoring
 paperswithcode_id: null
diff --git a/datasets/sem_eval_2020_task_11/README.md b/datasets/sem_eval_2020_task_11/README.md
index 945c1f094a3..c70e6b8285c 100644
--- a/datasets/sem_eval_2020_task_11/README.md
+++ b/datasets/sem_eval_2020_task_11/README.md
@@ -15,10 +15,10 @@ source_datasets:
 - original
 task_categories:
 - text-classification
-- structure-prediction
+- token-classification
 task_ids:
 - text-classification-other-propaganda-technique-classification
-- structure-prediction-other-propaganda-span-identification
+- token-classification-other-propaganda-span-identification
 paperswithcode_id: null
 pretty_name: "SemEval-2020 Task 11"
 ---
diff --git a/datasets/senti_ws/README.md b/datasets/senti_ws/README.md
index b5d2e37b498..0bb76a8d187 100644
--- a/datasets/senti_ws/README.md
+++ b/datasets/senti_ws/README.md
@@ -15,11 +15,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
-- text-scoring
+- token-classification
+- text-classification
 task_ids:
+- text-scoring
 - sentiment-scoring
-- structure-prediction-other-pos-tagging
+- part-of-speech-tagging
 paperswithcode_id: null
 pretty_name: SentiWS
 ---
diff --git a/datasets/sepedi_ner/README.md b/datasets/sepedi_ner/README.md
index 4917e4475c5..97e563cec02 100644
--- a/datasets/sepedi_ner/README.md
+++ b/datasets/sepedi_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/sesotho_ner_corpus/README.md b/datasets/sesotho_ner_corpus/README.md
index d51243f7800..65191198196 100644
--- a/datasets/sesotho_ner_corpus/README.md
+++ b/datasets/sesotho_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/setimes/README.md b/datasets/setimes/README.md
index 560e812a2f3..5c3377ed13c 100644
--- a/datasets/setimes/README.md
+++ b/datasets/setimes/README.md
@@ -24,9 +24,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 ---
 
diff --git a/datasets/setswana_ner_corpus/README.md b/datasets/setswana_ner_corpus/README.md
index 9cd0646cfb2..e5b19ad2a48 100644
--- a/datasets/setswana_ner_corpus/README.md
+++ b/datasets/setswana_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/silicone/README.md b/datasets/silicone/README.md
index 0a54a2a014d..750a5792545 100644
--- a/datasets/silicone/README.md
+++ b/datasets/silicone/README.md
@@ -33,49 +33,69 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
-- text-scoring
 task_ids:
   dyda_da:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   dyda_e:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-emotion-classification
   iemocap:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-emotion-classification
   maptask:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   meld_e:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-emotion-classification
   meld_s:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - sentiment-classification
   mrda:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   oasis:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
   sem:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - sentiment-classification
   swda:
+  - text-scoring
   - dialogue-modeling
   - language-modeling
+  - masked-language-modeling
   - text-classification-other-dialogue-act-classification
 paperswithcode_id: null
 pretty_name: SILICONE Benchmark
diff --git a/datasets/siswati_ner_corpus/README.md b/datasets/siswati_ner_corpus/README.md
index d3921d29960..0f89e86c676 100644
--- a/datasets/siswati_ner_corpus/README.md
+++ b/datasets/siswati_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/smartdata/README.md b/datasets/smartdata/README.md
index c889c00e059..1f2650d9e23 100644
--- a/datasets/smartdata/README.md
+++ b/datasets/smartdata/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/snow_simplified_japanese_corpus/README.md b/datasets/snow_simplified_japanese_corpus/README.md
index 946d5bf99ba..01ba5827bfa 100644
--- a/datasets/snow_simplified_japanese_corpus/README.md
+++ b/datasets/snow_simplified_japanese_corpus/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: SNOW T15 and T23 (simplified Japanese corpus)
 ---
diff --git a/datasets/so_stacksample/README.md b/datasets/so_stacksample/README.md
index 7f9c09c088a..1c67122e3c3 100644
--- a/datasets/so_stacksample/README.md
+++ b/datasets/so_stacksample/README.md
@@ -14,10 +14,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- question-answering
+- text2text-generation
 task_ids:
 - abstractive-qa
-- open-domain-qa
+- open-domain-abstractive-qa
 paperswithcode_id: null
 pretty_name: SO StackSample
 ---
diff --git a/datasets/social_bias_frames/README.md b/datasets/social_bias_frames/README.md
index dfee00c0b5a..8a29c68277b 100644
--- a/datasets/social_bias_frames/README.md
+++ b/datasets/social_bias_frames/README.md
@@ -15,10 +15,10 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 - text-classification
 task_ids:
-- explanation-generation
+- text2text-generation-other-explanation-generation
 - hate-speech-detection
 paperswithcode_id: null
 ---
diff --git a/datasets/sofc_materials_articles/README.md b/datasets/sofc_materials_articles/README.md
index ec314e5a7a0..94fe7632a2d 100644
--- a/datasets/sofc_materials_articles/README.md
+++ b/datasets/sofc_materials_articles/README.md
@@ -14,8 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
-- structure-prediction
+- text-generation
+- fill-mask
+- token-classification
 - text-classification
 task_ids:
 - named-entity-recognition
diff --git a/datasets/spanish_billion_words/README.md b/datasets/spanish_billion_words/README.md
index 2eaac990c4a..a921faa10cb 100644
--- a/datasets/spanish_billion_words/README.md
+++ b/datasets/spanish_billion_words/README.md
@@ -15,9 +15,11 @@ source_datasets:
 - original
 task_categories:
 - other
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 - other-other-pretraining-language-models
 paperswithcode_id: sbwce
 pretty_name: Spanish Billion Word Corpus and Embeddings
diff --git a/datasets/spc/README.md b/datasets/spc/README.md
index 9b2dc8d2a97..7a9e1489366 100644
--- a/datasets/spc/README.md
+++ b/datasets/spc/README.md
@@ -22,9 +22,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: spc
 ---
diff --git a/datasets/species_800/README.md b/datasets/species_800/README.md
index 828842f811c..6711d200f36 100644
--- a/datasets/species_800/README.md
+++ b/datasets/species_800/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/speech_commands/README.md b/datasets/speech_commands/README.md
index 991e1a68092..61a34f5ab50 100644
--- a/datasets/speech_commands/README.md
+++ b/datasets/speech_commands/README.md
@@ -18,9 +18,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
+- audio-classification
 task_ids:
-- other-other-keyword-spotting
+- keyword-spotting
 ---
 
 # Dataset Card for SpeechCommands
diff --git a/datasets/spider/README.md b/datasets/spider/README.md
index 45818ff30e2..fa5967bfa47 100644
--- a/datasets/spider/README.md
+++ b/datasets/spider/README.md
@@ -15,9 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- other-structured-to-text
+- text2text-generation-other-text-to-sql
 paperswithcode_id: spider-1
 pretty_name: Spider
 ---
diff --git a/datasets/srwac/README.md b/datasets/srwac/README.md
index a4da3f5aca4..7600eb58950 100644
--- a/datasets/srwac/README.md
+++ b/datasets/srwac/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: SrWac
 ---
diff --git a/datasets/sst/README.md b/datasets/sst/README.md
index 58366a8e8a8..c9c19e95284 100644
--- a/datasets/sst/README.md
+++ b/datasets/sst/README.md
@@ -18,8 +18,8 @@ size_categories:
 source_datasets: []
 task_categories:
 - text-classification
-- text-scoring
 task_ids:
+- text-scoring
 - sentiment-classification
 - sentiment-scoring
 paperswithcode_id: sst
diff --git a/datasets/stsb_multi_mt/README.md b/datasets/stsb_multi_mt/README.md
index 0bc2212dd49..71f96a435dd 100644
--- a/datasets/stsb_multi_mt/README.md
+++ b/datasets/stsb_multi_mt/README.md
@@ -25,8 +25,9 @@ size_categories:
 source_datasets:
 - extended|other-sts-b
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: null
 pretty_name: STSb Multi MT
diff --git a/datasets/superb/README.md b/datasets/superb/README.md
index 9d3903213f0..6a25d66990f 100644
--- a/datasets/superb/README.md
+++ b/datasets/superb/README.md
@@ -18,18 +18,16 @@ source_datasets:
 - extended|other-librimix
 - extended|other-speech_commands
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
-- phoneme-recognition
+task_ids:
 - keyword-spotting
 - query-by-example-spoken-term-detection
 - speaker-identification
 - automatic-speaker-verification
 - speaker-diarization
-- intent-classification
-- slot-filling
-- emotion-recognition
+- speaker-intent-classification
+- audio-slot-filling
+- speaker-emotion-recognition
 ---
 
 # Dataset Card for SUPERB
diff --git a/datasets/swahili/README.md b/datasets/swahili/README.md
index 67e7bbbd022..e7520931aa5 100644
--- a/datasets/swahili/README.md
+++ b/datasets/swahili/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: swahili
 ---
diff --git a/datasets/swedish_medical_ner/README.md b/datasets/swedish_medical_ner/README.md
index bf5d24a6597..73484aa562f 100644
--- a/datasets/swedish_medical_ner/README.md
+++ b/datasets/swedish_medical_ner/README.md
@@ -15,7 +15,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 pretty_name: SwedMedNER
diff --git a/datasets/swedish_ner_corpus/README.md b/datasets/swedish_ner_corpus/README.md
index b5bd0141a26..8be91728111 100644
--- a/datasets/swedish_ner_corpus/README.md
+++ b/datasets/swedish_ner_corpus/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/tanzil/README.md b/datasets/tanzil/README.md
index d01ed32af29..0587cb80213 100644
--- a/datasets/tanzil/README.md
+++ b/datasets/tanzil/README.md
@@ -55,9 +55,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: tanzil
 ---
diff --git a/datasets/tapaco/README.md b/datasets/tapaco/README.md
index ef2ea6ab124..27874146d4a 100644
--- a/datasets/tapaco/README.md
+++ b/datasets/tapaco/README.md
@@ -380,11 +380,11 @@ size_categories:
 source_datasets:
 - extended|other-tatoeba
 task_categories:
-- conditional-text-generation
+- text2text-generation
+- translation
 - text-classification
 task_ids:
-- conditional-text-generation-other-given-a-sentence-generate-a-paraphrase-either-in-same-language-or-another-language
-- machine-translation
+- text2text-generation-other-paraphrase-generation
 - semantic-similarity-classification
 paperswithcode_id: tapaco
 pretty_name: TaPaCo Corpus
diff --git a/datasets/tashkeela/README.md b/datasets/tashkeela/README.md
index 923e89d92f1..842190713f3 100644
--- a/datasets/tashkeela/README.md
+++ b/datasets/tashkeela/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 - other-diacritics-prediction
 paperswithcode_id: null
 pretty_name: Tashkeela
diff --git a/datasets/taskmaster1/README.md b/datasets/taskmaster1/README.md
index e36d40e69b6..d9f8dd2a499 100644
--- a/datasets/taskmaster1/README.md
+++ b/datasets/taskmaster1/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: taskmaster-1
diff --git a/datasets/taskmaster2/README.md b/datasets/taskmaster2/README.md
index 8945f0e38d4..a4c2850e678 100644
--- a/datasets/taskmaster2/README.md
+++ b/datasets/taskmaster2/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: taskmaster-2
diff --git a/datasets/taskmaster3/README.md b/datasets/taskmaster3/README.md
index 2255c721374..1de020d7814 100644
--- a/datasets/taskmaster3/README.md
+++ b/datasets/taskmaster3/README.md
@@ -14,7 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - dialogue-modeling
 paperswithcode_id: null
diff --git a/datasets/tatoeba/README.md b/datasets/tatoeba/README.md
index ce88b8e0673..856357917c0 100644
--- a/datasets/tatoeba/README.md
+++ b/datasets/tatoeba/README.md
@@ -372,9 +372,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: tatoeba
 pretty_name: Tatoeba
 ---
diff --git a/datasets/ted_iwlst2013/README.md b/datasets/ted_iwlst2013/README.md
index 9cee316b1bb..ba5f4b271be 100644
--- a/datasets/ted_iwlst2013/README.md
+++ b/datasets/ted_iwlst2013/README.md
@@ -55,9 +55,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: TedIwlst2013
 ---
diff --git a/datasets/ted_talks_iwslt/README.md b/datasets/ted_talks_iwslt/README.md
index 41354422610..4bf536811fc 100644
--- a/datasets/ted_talks_iwslt/README.md
+++ b/datasets/ted_talks_iwslt/README.md
@@ -152,9 +152,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: Web Inventory of Transcribed & Translated(WIT) Ted Talks
 ---
diff --git a/datasets/telugu_books/README.md b/datasets/telugu_books/README.md
index 9ec044df8a9..becff151032 100644
--- a/datasets/telugu_books/README.md
+++ b/datasets/telugu_books/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: TeluguBooks
 ---
diff --git a/datasets/telugu_news/README.md b/datasets/telugu_news/README.md
index 855b017cd9d..09a33707146 100644
--- a/datasets/telugu_news/README.md
+++ b/datasets/telugu_news/README.md
@@ -14,10 +14,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-classification
 task_ids:
 - language-modeling
+- masked-language-modeling
 - multi-class-classification
 - topic-classification
 paperswithcode_id: null
diff --git a/datasets/tep_en_fa_para/README.md b/datasets/tep_en_fa_para/README.md
index 62dcba438a3..c58cf71535e 100644
--- a/datasets/tep_en_fa_para/README.md
+++ b/datasets/tep_en_fa_para/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: TepEnFaPara
 ---
diff --git a/datasets/text2log/README.md b/datasets/text2log/README.md
index 54c9a22bf12..bcdeaaf10c0 100644
--- a/datasets/text2log/README.md
+++ b/datasets/text2log/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for text2log
diff --git a/datasets/thainer/README.md b/datasets/thainer/README.md
index a0cb4146b3c..cdd904d54ac 100644
--- a/datasets/thainer/README.md
+++ b/datasets/thainer/README.md
@@ -16,7 +16,7 @@ size_categories:
 source_datasets:
 - extended|other-tirasaroj-aroonmanakun
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 - part-of-speech-tagging
diff --git a/datasets/thaisum/README.md b/datasets/thaisum/README.md
index 2a5ed72444c..ca991ca90d0 100644
--- a/datasets/thaisum/README.md
+++ b/datasets/thaisum/README.md
@@ -14,11 +14,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-- sequence-modeling
+- summarization
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
-- summarization
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: ThaiSum
 ---
diff --git a/datasets/the_pile/README.md b/datasets/the_pile/README.md
index 04eea945da2..431e5cf78dc 100644
--- a/datasets/the_pile/README.md
+++ b/datasets/the_pile/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for The Pile
diff --git a/datasets/the_pile_books3/README.md b/datasets/the_pile_books3/README.md
index 8ca13c6a9a3..ab691304274 100644
--- a/datasets/the_pile_books3/README.md
+++ b/datasets/the_pile_books3/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for the_pile_books3
diff --git a/datasets/the_pile_openwebtext2/README.md b/datasets/the_pile_openwebtext2/README.md
index 5a6f3885282..bb7ea6c387b 100644
--- a/datasets/the_pile_openwebtext2/README.md
+++ b/datasets/the_pile_openwebtext2/README.md
@@ -15,10 +15,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - text-scoring
 task_ids:
 - language-modeling
+- masked-language-modeling
 - text-scoring-other-rating
 ---
 
diff --git a/datasets/the_pile_stack_exchange/README.md b/datasets/the_pile_stack_exchange/README.md
index aefb716d72d..7555e5bcf83 100644
--- a/datasets/the_pile_stack_exchange/README.md
+++ b/datasets/the_pile_stack_exchange/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for Stack Exchange
diff --git a/datasets/tilde_model/README.md b/datasets/tilde_model/README.md
index 489bbb21785..020d32b23ae 100644
--- a/datasets/tilde_model/README.md
+++ b/datasets/tilde_model/README.md
@@ -43,9 +43,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: tilde-model-corpus
 pretty_name: Tilde Multilingual Open Data for European Languages
 ---
diff --git a/datasets/times_of_india_news_headlines/README.md b/datasets/times_of_india_news_headlines/README.md
index 780c6a5fe11..ec2a55f210d 100644
--- a/datasets/times_of_india_news_headlines/README.md
+++ b/datasets/times_of_india_news_headlines/README.md
@@ -14,13 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 - text-retrieval
 task_ids:
 - document-retrieval
-- explanation-generation
 - fact-checking-retrieval
-- other-structured-to-text
 - text-simplification
 paperswithcode_id: null
 pretty_name: Times of India News Headlines
diff --git a/datasets/timit_asr/README.md b/datasets/timit_asr/README.md
index 35eba5d4015..066aa791c6d 100644
--- a/datasets/timit_asr/README.md
+++ b/datasets/timit_asr/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 paperswithcode_id: timit
 ---
 
diff --git a/datasets/tlc/README.md b/datasets/tlc/README.md
index d346396edfa..30c8a9d2017 100644
--- a/datasets/tlc/README.md
+++ b/datasets/tlc/README.md
@@ -16,9 +16,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 ---
 
diff --git a/datasets/tmu_gfm_dataset/README.md b/datasets/tmu_gfm_dataset/README.md
index 6d89c5e21d0..bced365b97a 100644
--- a/datasets/tmu_gfm_dataset/README.md
+++ b/datasets/tmu_gfm_dataset/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-grammatical-error-correction
+- text2text-generation-other-grammatical-error-correction
 paperswithcode_id: null
 pretty_name: TMU-GFM-Dataset
 ---
diff --git a/datasets/totto/README.md b/datasets/totto/README.md
index 6be6bb4d4b2..4f692ba216f 100644
--- a/datasets/totto/README.md
+++ b/datasets/totto/README.md
@@ -14,9 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - table-to-text
+task_ids: []
 paperswithcode_id: totto
 pretty_name: ToTTo
 ---
diff --git a/datasets/trivia_qa/README.md b/datasets/trivia_qa/README.md
index 1d617173957..4bd57552359 100644
--- a/datasets/trivia_qa/README.md
+++ b/datasets/trivia_qa/README.md
@@ -18,8 +18,10 @@ source_datasets:
 - original
 task_categories:
 - question-answering
+- text2text-generation
 task_ids:
 - open-domain-qa
+- open-domain-abstractive-qa
 - extractive-qa
 - abstractive-qa
 ---
diff --git a/datasets/turk/README.md b/datasets/turk/README.md
index 7673f9ba9c3..84ec0f00e26 100644
--- a/datasets/turk/README.md
+++ b/datasets/turk/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
 - text-simplification
 paperswithcode_id: null
diff --git a/datasets/turkic_xwmt/README.md b/datasets/turkic_xwmt/README.md
index fe5ef21eae6..12193675500 100644
--- a/datasets/turkic_xwmt/README.md
+++ b/datasets/turkic_xwmt/README.md
@@ -282,9 +282,8 @@ pretty_name: turkic_xwmt
 size_categories:
 - n<1K
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 source_datasets:
 - extended|WMT 2020 News Translation Task
 ---
diff --git a/datasets/turkish_ner/README.md b/datasets/turkish_ner/README.md
index ca9b21a0ede..7a295c9c37e 100644
--- a/datasets/turkish_ner/README.md
+++ b/datasets/turkish_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/turkish_shrinked_ner/README.md b/datasets/turkish_shrinked_ner/README.md
index bd210860fef..d292d554d0f 100644
--- a/datasets/turkish_shrinked_ner/README.md
+++ b/datasets/turkish_shrinked_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - extended|other-turkish_ner
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/turku_ner_corpus/README.md b/datasets/turku_ner_corpus/README.md
index 1c96fc7f22b..3d79998ca15 100644
--- a/datasets/turku_ner_corpus/README.md
+++ b/datasets/turku_ner_corpus/README.md
@@ -15,7 +15,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/tweets_ar_en_parallel/README.md b/datasets/tweets_ar_en_parallel/README.md
index c96d0fb0710..42be16fd5d9 100644
--- a/datasets/tweets_ar_en_parallel/README.md
+++ b/datasets/tweets_ar_en_parallel/README.md
@@ -16,9 +16,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- other
+- translation
 task_ids:
-- other-other-machine-translation
+- translation-other-tweets-translation
 paperswithcode_id: bilingual-corpus-of-arabic-english-parallel
 pretty_name: Bilingual Corpus of Arabic-English Parallel Tweets
 ---
diff --git a/datasets/twi_text_c3/README.md b/datasets/twi_text_c3/README.md
index 22cfd763f2b..359921a4ff2 100644
--- a/datasets/twi_text_c3/README.md
+++ b/datasets/twi_text_c3/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Twi Text C3
 ---
diff --git a/datasets/twi_wordsim353/README.md b/datasets/twi_wordsim353/README.md
index c34b07b6c41..19ddb12681a 100644
--- a/datasets/twi_wordsim353/README.md
+++ b/datasets/twi_wordsim353/README.md
@@ -14,8 +14,9 @@ size_categories:
 - n<1K
 source_datasets: []
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: null
 pretty_name: Yorùbá Wordsim-353
diff --git a/datasets/udhr/README.md b/datasets/udhr/README.md
index b9c31c4acf7..c8596fb15c5 100644
--- a/datasets/udhr/README.md
+++ b/datasets/udhr/README.md
@@ -417,9 +417,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: The Universal Declaration of Human Rights (UDHR)
 ---
diff --git a/datasets/um005/README.md b/datasets/um005/README.md
index 4b60babf3ca..d971660e236 100644
--- a/datasets/um005/README.md
+++ b/datasets/um005/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: umc005-english-urdu
 pretty_name: UMC005 English-Urdu
 ---
diff --git a/datasets/un_ga/README.md b/datasets/un_ga/README.md
index accfbecb42b..b0735e132e7 100644
--- a/datasets/un_ga/README.md
+++ b/datasets/un_ga/README.md
@@ -58,9 +58,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: UnGa
 ---
diff --git a/datasets/un_multi/README.md b/datasets/un_multi/README.md
index 11b02174779..9b1f0de3b56 100644
--- a/datasets/un_multi/README.md
+++ b/datasets/un_multi/README.md
@@ -76,9 +76,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: multiun
 pretty_name: Multilingual Corpus from United Nation Documents
 ---
diff --git a/datasets/un_pc/README.md b/datasets/un_pc/README.md
index 47140f7015a..0097d500c42 100644
--- a/datasets/un_pc/README.md
+++ b/datasets/un_pc/README.md
@@ -58,9 +58,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: united-nations-parallel-corpus
 pretty_name: United Nations Parallel Corpus
 ---
diff --git a/datasets/universal_morphologies/README.md b/datasets/universal_morphologies/README.md
index 141a5089091..0d1e6702b78 100644
--- a/datasets/universal_morphologies/README.md
+++ b/datasets/universal_morphologies/README.md
@@ -452,12 +452,12 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 - text-classification
 task_ids:
 - multi-class-classification
 - multi-label-classification
-- structure-prediction-other-morphology
+- token-classification-other-morphology
 paperswithcode_id: null
 pretty_name: UniversalMorphologies
 ---
diff --git a/datasets/vctk/README.md b/datasets/vctk/README.md
index 1e6ac4d449d..37373094d28 100644
--- a/datasets/vctk/README.md
+++ b/datasets/vctk/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 paperswithcode_id: vctk
 ---
 
diff --git a/datasets/vivos/README.md b/datasets/vivos/README.md
index dd77ffb5ce2..7e230912365 100644
--- a/datasets/vivos/README.md
+++ b/datasets/vivos/README.md
@@ -16,9 +16,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- speech-processing
-task_ids:
 - automatic-speech-recognition
+task_ids: []
 ---
 
 # Dataset Card for VIVOS
diff --git a/datasets/web_nlg/README.md b/datasets/web_nlg/README.md
index dfd5c0ac6de..ad5ad0828d9 100644
--- a/datasets/web_nlg/README.md
+++ b/datasets/web_nlg/README.md
@@ -32,39 +32,9 @@ source_datasets:
 - extended|other-db_pedia
 - original
 task_categories:
-  release_v1:
-  - conditional-text-generation
-  release_v2:
-  - conditional-text-generation
-  release_v2.1:
-  - conditional-text-generation
-  release_v2.1_constrained:
-  - conditional-text-generation
-  release_v2_constrained:
-  - conditional-text-generation
-  release_v3.0_en:
-  - conditional-text-generation
-  release_v3.0_ru:
-  - conditional-text-generation
-  webnlg_challenge_2017:
-  - conditional-text-generation
+- structured-to-text
 task_ids:
-  release_v1:
-  - other-structured-to-text
-  release_v2:
-  - other-structured-to-text
-  release_v2.1:
-  - other-structured-to-text
-  release_v2.1_constrained:
-  - other-structured-to-text
-  release_v2_constrained:
-  - other-structured-to-text
-  release_v3.0_en:
-  - other-structured-to-text
-  release_v3.0_ru:
-  - other-structured-to-text
-  webnlg_challenge_2017:
-  - other-structured-to-text
+- rdf-to-text
 paperswithcode_id: webnlg
 pretty_name: WebNLG
 ---
diff --git a/datasets/weibo_ner/README.md b/datasets/weibo_ner/README.md
index 9e952fc9a7e..105a5f6b221 100644
--- a/datasets/weibo_ner/README.md
+++ b/datasets/weibo_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: weibo-ner
diff --git a/datasets/wi_locness/README.md b/datasets/wi_locness/README.md
index 361e4fee8b3..c51f854d7dc 100644
--- a/datasets/wi_locness/README.md
+++ b/datasets/wi_locness/README.md
@@ -18,9 +18,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
-- conditional-text-generation-other-grammatical-error-correction
+- text2text-generation-other-grammatical-error-correction
 paperswithcode_id: locness-corpus
 pretty_name:
   wi: Cambridge English Write & Improve
diff --git a/datasets/wiki_asp/README.md b/datasets/wiki_asp/README.md
index 841065de7f3..b99532ce7da 100644
--- a/datasets/wiki_asp/README.md
+++ b/datasets/wiki_asp/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-aspect-based-summarization
 paperswithcode_id: wikiasp
 pretty_name: WikiAsp
 ---
diff --git a/datasets/wiki_atomic_edits/README.md b/datasets/wiki_atomic_edits/README.md
index c29443bff2e..83f18989575 100644
--- a/datasets/wiki_atomic_edits/README.md
+++ b/datasets/wiki_atomic_edits/README.md
@@ -76,10 +76,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- explanation-generation
 - summarization
+task_ids: []
 paperswithcode_id: wikiatomicedits
 pretty_name: WikiAtomicEdits
 ---
diff --git a/datasets/wiki_auto/README.md b/datasets/wiki_auto/README.md
index a507922b5e4..934502ec923 100644
--- a/datasets/wiki_auto/README.md
+++ b/datasets/wiki_auto/README.md
@@ -23,7 +23,7 @@ size_categories:
 source_datasets:
 - extended|other-wikipedia
 task_categories:
-- conditional-text-generation
+- text2text-generation
 task_ids:
 - text-simplification
 paperswithcode_id: null
diff --git a/datasets/wiki_bio/README.md b/datasets/wiki_bio/README.md
index 3d883233c5d..a562b5fafc0 100644
--- a/datasets/wiki_bio/README.md
+++ b/datasets/wiki_bio/README.md
@@ -14,10 +14,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- explanation-generation
 - table-to-text
+task_ids: []
 paperswithcode_id: wikibio
 pretty_name: WikiBio
 ---
diff --git a/datasets/wiki_dpr/README.md b/datasets/wiki_dpr/README.md
index cb576874918..afd8ad0aa7d 100644
--- a/datasets/wiki_dpr/README.md
+++ b/datasets/wiki_dpr/README.md
@@ -9,10 +9,12 @@ licenses:
 - cc-by-sa-3.0
 - gfdl-1.3-or-later
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 - other-text-search
 task_ids:
 - language-modeling
+- masked-language-modeling
 - other-neural-search
 source_datasets:
 - original
diff --git a/datasets/wiki_lingua/README.md b/datasets/wiki_lingua/README.md
index 98a4622a694..970e7212f3b 100644
--- a/datasets/wiki_lingua/README.md
+++ b/datasets/wiki_lingua/README.md
@@ -84,9 +84,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids: []
 paperswithcode_id: wikilingua
 pretty_name: WikiLingua
 ---
diff --git a/datasets/wiki_source/README.md b/datasets/wiki_source/README.md
index 40e8ac13e11..7e455a6243c 100644
--- a/datasets/wiki_source/README.md
+++ b/datasets/wiki_source/README.md
@@ -15,9 +15,8 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 pretty_name: WikiSource
 ---
diff --git a/datasets/wiki_summary/README.md b/datasets/wiki_summary/README.md
index 6ff40447f8e..7287429a0bc 100644
--- a/datasets/wiki_summary/README.md
+++ b/datasets/wiki_summary/README.md
@@ -14,14 +14,15 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- conditional-text-generation
+- text2text-generation
+- translation
 - question-answering
+- summarization
 task_ids:
 - abstractive-qa
 - explanation-generation
 - extractive-qa
-- machine-translation
 - open-domain-qa
+- open-domain-abstractive-qa
-- summarization
 - text-simplification
 pretty_name: WikiSummary
diff --git a/datasets/wikiann/README.md b/datasets/wikiann/README.md
index af6f3560291..1bdd23164a3 100644
--- a/datasets/wikiann/README.md
+++ b/datasets/wikiann/README.md
@@ -365,7 +365,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: wikiann-1
diff --git a/datasets/wikicorpus/README.md b/datasets/wikicorpus/README.md
index 6fd8a20a25c..aa2311f258e 100644
--- a/datasets/wikicorpus/README.md
+++ b/datasets/wikicorpus/README.md
@@ -49,37 +49,43 @@ source_datasets:
 - original
 task_categories:
   raw_ca:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   raw_en:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   raw_es:
-  - sequence-modeling
+  - text-generation
+  - fill-mask
   tagged_ca:
-  - structure-prediction
+  - token-classification
   - text-classification
   tagged_en:
-  - structure-prediction
+  - token-classification
   - text-classification
   tagged_es:
-  - structure-prediction
+  - token-classification
   - text-classification
 task_ids:
   raw_ca:
   - language-modeling
+  - masked-language-modeling
   raw_en:
   - language-modeling
+  - masked-language-modeling
   raw_es:
   - language-modeling
+  - masked-language-modeling
   tagged_ca:
-  - structure-prediction-other-lemmatization
+  - token-classification-other-lemmatization
   - part-of-speech-tagging
   - text-classification-other-word-sense-disambiguation
   tagged_en:
-  - structure-prediction-other-lemmatization
+  - token-classification-other-lemmatization
   - part-of-speech-tagging
   - text-classification-other-word-sense-disambiguation
   tagged_es:
-  - structure-prediction-other-lemmatization
+  - token-classification-other-lemmatization
   - part-of-speech-tagging
   - text-classification-other-word-sense-disambiguation
 paperswithcode_id: null
diff --git a/datasets/wikipedia/README.md b/datasets/wikipedia/README.md
index b990f47ee59..a852efe36aa 100644
--- a/datasets/wikipedia/README.md
+++ b/datasets/wikipedia/README.md
@@ -9,9 +9,11 @@ licenses:
 - cc-by-sa-3.0
 - gfdl-1.3-or-later
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 source_datasets:
 - original
 multilinguality:
diff --git a/datasets/wikitext/README.md b/datasets/wikitext/README.md
index 842fa444ce9..3bccab21f8e 100644
--- a/datasets/wikitext/README.md
+++ b/datasets/wikitext/README.md
@@ -17,9 +17,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 ---
 
 # Dataset Card for "wikitext"
diff --git a/datasets/wikitext_tl39/README.md b/datasets/wikitext_tl39/README.md
index 40757886354..bb62d4236b8 100644
--- a/datasets/wikitext_tl39/README.md
+++ b/datasets/wikitext_tl39/README.md
@@ -15,9 +15,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: wikitext-tl-39
 pretty_name: WikiText-TL-39
 ---
diff --git a/datasets/wino_bias/README.md b/datasets/wino_bias/README.md
index 6f7b8d11042..9765e25d0b3 100644
--- a/datasets/wino_bias/README.md
+++ b/datasets/wino_bias/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - coreference-resolution
 paperswithcode_id: winobias
diff --git a/datasets/winograd_wsc/README.md b/datasets/winograd_wsc/README.md
index 34398c8d751..a1e6e56aee0 100644
--- a/datasets/winograd_wsc/README.md
+++ b/datasets/winograd_wsc/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- multiple-choice
 task_ids:
 - coreference-resolution
 paperswithcode_id: wsc
diff --git a/datasets/wisesight1000/README.md b/datasets/wisesight1000/README.md
index 7abd0a61cf8..fdb7267317b 100644
--- a/datasets/wisesight1000/README.md
+++ b/datasets/wisesight1000/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - extended|wisesight_sentiment
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
-- structure-prediction-other-word-tokenization
+- token-classification-other-word-tokenization
 paperswithcode_id: null
 pretty_name: wisesight1000
 ---
diff --git a/datasets/wmt14/README.md b/datasets/wmt14/README.md
index 080aa0c91db..18a0c4145c6 100644
--- a/datasets/wmt14/README.md
+++ b/datasets/wmt14/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: wmt-2014
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt14"
diff --git a/datasets/wmt15/README.md b/datasets/wmt15/README.md
index f385e02368c..555deee4087 100644
--- a/datasets/wmt15/README.md
+++ b/datasets/wmt15/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: wmt-2015
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt15"
diff --git a/datasets/wmt16/README.md b/datasets/wmt16/README.md
index a17b2e6475c..1b745336715 100644
--- a/datasets/wmt16/README.md
+++ b/datasets/wmt16/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: wmt-2016
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt16"
diff --git a/datasets/wmt17/README.md b/datasets/wmt17/README.md
index a9c024baae0..acabc271105 100644
--- a/datasets/wmt17/README.md
+++ b/datasets/wmt17/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: null
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt17"
diff --git a/datasets/wmt18/README.md b/datasets/wmt18/README.md
index 8e8ca2206fe..efe05ea201b 100644
--- a/datasets/wmt18/README.md
+++ b/datasets/wmt18/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: wmt-2018
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt18"
diff --git a/datasets/wmt19/README.md b/datasets/wmt19/README.md
index 3b39ef4c951..0cd7538f0e1 100644
--- a/datasets/wmt19/README.md
+++ b/datasets/wmt19/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: null
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt19"
diff --git a/datasets/wmt20_mlqe_task1/README.md b/datasets/wmt20_mlqe_task1/README.md
index 6f717b4d718..5f83fed45de 100644
--- a/datasets/wmt20_mlqe_task1/README.md
+++ b/datasets/wmt20_mlqe_task1/README.md
@@ -37,9 +37,8 @@ source_datasets:
 - extended|reddit
 - extended|wikipedia
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 ---
 
diff --git a/datasets/wmt20_mlqe_task2/README.md b/datasets/wmt20_mlqe_task2/README.md
index f3e370a2af8..c1890965bb0 100644
--- a/datasets/wmt20_mlqe_task2/README.md
+++ b/datasets/wmt20_mlqe_task2/README.md
@@ -21,9 +21,8 @@ size_categories:
 source_datasets:
 - extended|wikipedia
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 ---
 
diff --git a/datasets/wmt20_mlqe_task3/README.md b/datasets/wmt20_mlqe_task3/README.md
index 692297472a4..c61520f4bff 100644
--- a/datasets/wmt20_mlqe_task3/README.md
+++ b/datasets/wmt20_mlqe_task3/README.md
@@ -17,9 +17,8 @@ size_categories:
 source_datasets:
 - extended|amazon_us_reviews
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 paperswithcode_id: null
 ---
 
diff --git a/datasets/wmt_t2t/README.md b/datasets/wmt_t2t/README.md
index 3727d4ccfd7..67e22ba9256 100644
--- a/datasets/wmt_t2t/README.md
+++ b/datasets/wmt_t2t/README.md
@@ -4,9 +4,8 @@ paperswithcode_id: null
 multilinguality:
 - translation
 task_categories:
-- conditional-text-generation
-task_ids:
-- machine-translation
+- translation
+task_ids: []
 ---
 
 # Dataset Card for "wmt_t2t"
diff --git a/datasets/wnut_17/README.md b/datasets/wnut_17/README.md
index 9cc8b6d6b7d..b31e2b56fc4 100644
--- a/datasets/wnut_17/README.md
+++ b/datasets/wnut_17/README.md
@@ -16,7 +16,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 ---
diff --git a/datasets/woz_dialogue/README.md b/datasets/woz_dialogue/README.md
index 2689ecea5de..f215ace989a 100644
--- a/datasets/woz_dialogue/README.md
+++ b/datasets/woz_dialogue/README.md
@@ -25,8 +25,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
-- structure-prediction
+- text-generation
+- fill-mask
+- token-classification
 - text-classification
 task_ids:
 - dialogue-modeling
diff --git a/datasets/xglue/README.md b/datasets/xglue/README.md
index bbff7f6924c..f83c5006d7a 100644
--- a/datasets/xglue/README.md
+++ b/datasets/xglue/README.md
@@ -237,19 +237,19 @@ task_categories:
   nc:
   - text-classification
   ner:
-  - structure-prediction
+  - token-classification
   ntg:
-  - conditional-text-generation
+  - summarization
   paws-x:
   - text-classification
   pos:
-  - structure-prediction
+  - token-classification
   qadsm:
   - text-classification
   qam:
   - text-classification
   qg:
-  - conditional-text-generation
+  - text2text-generation
   wpr:
   - text-classification
   xnli:
@@ -262,8 +262,7 @@ task_ids:
   - topic-classification
   ner:
   - named-entity-recognition
-  ntg:
-  - summarization
+  ntg: []
   paws-x:
   - text-classification-other-paraphrase-identification
   pos:
@@ -273,7 +272,7 @@ task_ids:
   qam:
   - acceptability-classification
   qg:
-  - conditional-text-generation-other-question-answering
+  - text2text-generation-other-question-answering
   wpr:
   - acceptability-classification
   xnli:
diff --git a/datasets/xsum/README.md b/datasets/xsum/README.md
index 8408d6a3692..0fb3a493006 100644
--- a/datasets/xsum/README.md
+++ b/datasets/xsum/README.md
@@ -4,9 +4,9 @@ languages:
 - en
 paperswithcode_id: xsum
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- news-articles-summarization
 ---
 
 # Dataset Card for "xsum"
diff --git a/datasets/xsum_factuality/README.md b/datasets/xsum_factuality/README.md
index b6a4a98bf0f..7693775774e 100644
--- a/datasets/xsum_factuality/README.md
+++ b/datasets/xsum_factuality/README.md
@@ -14,9 +14,9 @@ size_categories:
 source_datasets:
 - extended|other-xsum
 task_categories:
-- conditional-text-generation
-task_ids:
 - summarization
+task_ids:
+- summarization-other-hallucinations
 paperswithcode_id: null
 pretty_name: XSum Hallucination Annotations
 ---
diff --git a/datasets/xtreme/README.md b/datasets/xtreme/README.md
index 45b697743d9..e16ee13bd8b 100644
--- a/datasets/xtreme/README.md
+++ b/datasets/xtreme/README.md
@@ -450,7 +450,7 @@ source_datasets:
 - extended|squad
 task_categories:
 - question-answering
-- structure-prediction
+- token-classification
 - text-classification
 - text-retrieval
 task_ids:
diff --git a/datasets/yoruba_gv_ner/README.md b/datasets/yoruba_gv_ner/README.md
index 85af9fa0f75..8f44860f76f 100644
--- a/datasets/yoruba_gv_ner/README.md
+++ b/datasets/yoruba_gv_ner/README.md
@@ -14,7 +14,7 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- structure-prediction
+- token-classification
 task_ids:
 - named-entity-recognition
 paperswithcode_id: null
diff --git a/datasets/yoruba_text_c3/README.md b/datasets/yoruba_text_c3/README.md
index 192df47fe55..0c5a90ec7dd 100644
--- a/datasets/yoruba_text_c3/README.md
+++ b/datasets/yoruba_text_c3/README.md
@@ -14,9 +14,11 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - language-modeling
+- masked-language-modeling
 paperswithcode_id: null
 pretty_name: Yorùbá Text C3
 ---
diff --git a/datasets/yoruba_wordsim353/README.md b/datasets/yoruba_wordsim353/README.md
index a687a6073b9..d25bfe27327 100644
--- a/datasets/yoruba_wordsim353/README.md
+++ b/datasets/yoruba_wordsim353/README.md
@@ -15,8 +15,9 @@ size_categories:
 source_datasets:
 - original
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: null
 pretty_name: Wordsim-353 In Yorùbá (YorubaWordsim353)
diff --git a/datasets/youtube_caption_corrections/README.md b/datasets/youtube_caption_corrections/README.md
index 56fc987ccc4..3f941d5c242 100644
--- a/datasets/youtube_caption_corrections/README.md
+++ b/datasets/youtube_caption_corrections/README.md
@@ -16,7 +16,8 @@ source_datasets:
 - original
 task_categories:
 - other
-- sequence-modeling
+- text-generation
+- fill-mask
 task_ids:
 - other-other-token-classification-of-text-errors
 - slot-filling
diff --git a/datasets/zest/README.md b/datasets/zest/README.md
index 40141f5ba02..b62aa03313e 100644
--- a/datasets/zest/README.md
+++ b/datasets/zest/README.md
@@ -15,12 +15,12 @@ source_datasets:
 - original
 task_categories:
 - question-answering
-- structure-prediction
+- token-classification
 task_ids:
 - closed-domain-qa
 - extractive-qa
 - question-answering-other-yes-no-qa
-- structure-prediction-other-output-structure
+- token-classification-other-output-structure
 paperswithcode_id: zest
 pretty_name: ZEST
 ---

From 86fcef2cf2e082e042af03a287bc427c3b2965b5 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 30 Mar 2022 17:53:31 +0200
Subject: [PATCH 03/10] more cards updates

---
 datasets/dart/README.md             | 2 +-
 datasets/enriched_web_nlg/README.md | 2 +-
 datasets/gem/README.md              | 6 +++---
 datasets/stsb_mt_sv/README.md       | 3 ++-
 datasets/web_nlg/README.md          | 2 +-
 5 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/datasets/dart/README.md b/datasets/dart/README.md
index a62f65f6595..61a27de7522 100644
--- a/datasets/dart/README.md
+++ b/datasets/dart/README.md
@@ -19,7 +19,7 @@ source_datasets:
 - extended|web_nlg
 - extended|cleaned_e2e
 task_categories:
-- structured-to-text
+- tabular-to-text
 task_ids:
 - rdf-to-text
 paperswithcode_id: dart
diff --git a/datasets/enriched_web_nlg/README.md b/datasets/enriched_web_nlg/README.md
index 325426cded6..23ed1ea2bbb 100644
--- a/datasets/enriched_web_nlg/README.md
+++ b/datasets/enriched_web_nlg/README.md
@@ -17,7 +17,7 @@ size_categories:
 source_datasets:
 - extended|other-web-nlg
 task_categories:
-- structured-to-text
+- tabular-to-text
 task_ids:
 - rdf-to-text
 paperswithcode_id: null
diff --git a/datasets/gem/README.md b/datasets/gem/README.md
index c8a390f01b4..a4eea71128c 100644
--- a/datasets/gem/README.md
+++ b/datasets/gem/README.md
@@ -219,7 +219,7 @@ task_categories:
   cs_restaurants:
   - text2text-generation
   dart:
-  - structured-to-text
+  - tabular-to-text
   e2e_nlg:
   - text2text-generation
   mlsum_de:
@@ -232,9 +232,9 @@ task_categories:
   totto:
   - text2text-generation
   web_nlg_en:
-  - structured-to-text
+  - tabular-to-text
   web_nlg_ru:
-  - structured-to-text
+  - tabular-to-text
   wiki_auto_asset_turk:
   - text2text-generation
   wiki_lingua_es_en:
diff --git a/datasets/stsb_mt_sv/README.md b/datasets/stsb_mt_sv/README.md
index c6af47e0488..5f169581c9b 100644
--- a/datasets/stsb_mt_sv/README.md
+++ b/datasets/stsb_mt_sv/README.md
@@ -15,8 +15,9 @@ size_categories:
 source_datasets:
 - extended|other-sts-b
 task_categories:
-- text-scoring
+- text-classification
 task_ids:
+- text-scoring
 - semantic-similarity-scoring
 paperswithcode_id: null
 pretty_name: Swedish Machine Translated STS-B
diff --git a/datasets/web_nlg/README.md b/datasets/web_nlg/README.md
index ad5ad0828d9..23095876a52 100644
--- a/datasets/web_nlg/README.md
+++ b/datasets/web_nlg/README.md
@@ -32,7 +32,7 @@ source_datasets:
 - extended|other-db_pedia
 - original
 task_categories:
-- structured-to-text
+- tabular-to-text
 task_ids:
 - rdf-to-text
 paperswithcode_id: webnlg

From 5ef9b7cfaeecb920d7a2de4b38248835c116ff22 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 30 Mar 2022 17:53:49 +0200
Subject: [PATCH 04/10] update dataset tags parser

---
 src/datasets/utils/metadata.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/datasets/utils/metadata.py b/src/datasets/utils/metadata.py
index 090b59c25a6..a0ed9469ea4 100644
--- a/src/datasets/utils/metadata.py
+++ b/src/datasets/utils/metadata.py
@@ -321,9 +321,9 @@ def validate_task_categories(task_categories: Union[List[str], Dict[str, List[st
     def validate_task_ids(task_ids: Union[List[str], Dict[str, List[str]]]) -> ValidatorOutput:
         # TODO: we're currently ignoring all values starting with 'other' as our task taxonomy is bound to change
         #   in the near future and we don't want to waste energy in tagging against a moving taxonomy.
-        known_set = [tid for _cat, d in known_task_ids.items() for tid in d["options"]]
+        known_set = [tid for _cat, d in known_task_ids.items() for tid in d.get("subtasks", [])]
         validated, error = tagset_validator(
-            task_ids, known_set, "task_ids", known_task_ids_url, lambda e: "-other-" in e or e.startswith("other-")
+            task_ids, known_set, "task_ids", known_task_ids_url, lambda e: not e or "-other-" in e or e.startswith("other-")
         )
         return validated, error
 

From 526dba9dce6f983ebcacd65bef35a868a5735df6 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 30 Mar 2022 17:53:57 +0200
Subject: [PATCH 05/10] fix multi-choice-qa

---
 src/datasets/utils/resources/tasks.json | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/datasets/utils/resources/tasks.json b/src/datasets/utils/resources/tasks.json
index 540e6ffbccd..4d5658d7645 100644
--- a/src/datasets/utils/resources/tasks.json
+++ b/src/datasets/utils/resources/tasks.json
@@ -55,7 +55,7 @@
     "multiple-choice": {
         "type": "text",
         "subtasks": [
-            "multiple-choice-question-answering",
+            "multiple-choice-qa",
             "multiple-choice-coreference-resolution"
         ]
     },
@@ -201,5 +201,8 @@
     },
     "reinforcement-learning": {
         "type": "other"
+    },
+    "other": {
+        "type": "other"
     }
 }
\ No newline at end of file

From a6fb7e9485a681d37965ea17cb557257c9e0af2e Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Fri, 8 Apr 2022 17:45:52 +0200
Subject: [PATCH 06/10] style

---
 src/datasets/utils/metadata.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/src/datasets/utils/metadata.py b/src/datasets/utils/metadata.py
index a0ed9469ea4..23f41b93e02 100644
--- a/src/datasets/utils/metadata.py
+++ b/src/datasets/utils/metadata.py
@@ -323,7 +323,11 @@ def validate_task_ids(task_ids: Union[List[str], Dict[str, List[str]]]) -> Valid
         #   in the near future and we don't want to waste energy in tagging against a moving taxonomy.
         known_set = [tid for _cat, d in known_task_ids.items() for tid in d.get("subtasks", [])]
         validated, error = tagset_validator(
-            task_ids, known_set, "task_ids", known_task_ids_url, lambda e: not e or "-other-" in e or e.startswith("other-")
+            task_ids,
+            known_set,
+            "task_ids",
+            known_task_ids_url,
+            lambda e: not e or "-other-" in e or e.startswith("other-"),
         )
         return validated, error
 

From 54e9964e5a1f72459cabc2eab21e07c4c273dc9f Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Fri, 8 Apr 2022 19:50:54 +0200
Subject: [PATCH 07/10] small improvements in some dataset cards

---
 datasets/id_liputan6/README.md              | 4 +++-
 datasets/librispeech_asr/README.md          | 6 ++++--
 datasets/multilingual_librispeech/README.md | 6 ++++--
 datasets/wmt20_mlqe_task2/README.md         | 7 +++++--
 4 files changed, 16 insertions(+), 7 deletions(-)

diff --git a/datasets/id_liputan6/README.md b/datasets/id_liputan6/README.md
index 4e78415ee70..5cea1c06a44 100644
--- a/datasets/id_liputan6/README.md
+++ b/datasets/id_liputan6/README.md
@@ -15,7 +15,9 @@ source_datasets:
 - original
 task_categories:
 - summarization
-task_ids: []
+task_ids:
+- summarization-other-extractive-summarization
+- news-articles-summarization
 paperswithcode_id: null
 pretty_name: Large-scale Indonesian Summarization
 ---
diff --git a/datasets/librispeech_asr/README.md b/datasets/librispeech_asr/README.md
index 329ecfb246b..8806cab4258 100644
--- a/datasets/librispeech_asr/README.md
+++ b/datasets/librispeech_asr/README.md
@@ -18,7 +18,9 @@ source_datasets:
 - original
 task_categories:
 - automatic-speech-recognition
-task_ids: []
+- audio-classification
+task_ids:
+- audio-speaker-identification
 ---
 
 # Dataset Card for librispeech_asr
@@ -61,7 +63,7 @@ LibriSpeech is a corpus of approximately 1000 hours of 16kHz read English speech
 
 ### Supported Tasks and Leaderboards
 
-- `automatic-speech-recognition`, `speaker-identification`: The dataset can be used to train a model for Automatic Speech Recognition (ASR). The model is presented with an audio file and asked to transcribe the audio file to written text. The most common evaluation metric is the word error rate (WER). The task has an active leaderboard which can be found at https://paperswithcode.com/sota/speech-recognition-on-librispeech-test-clean and ranks models based on their WER.
+- `automatic-speech-recognition`, `audio-speaker-identification`: The dataset can be used to train a model for Automatic Speech Recognition (ASR). The model is presented with an audio file and asked to transcribe the audio file to written text. The most common evaluation metric is the word error rate (WER). The task has an active leaderboard which can be found at https://paperswithcode.com/sota/speech-recognition-on-librispeech-test-clean and ranks models based on their WER.
 
 ### Languages
 
diff --git a/datasets/multilingual_librispeech/README.md b/datasets/multilingual_librispeech/README.md
index 5d390f3f25f..87c9e25898c 100644
--- a/datasets/multilingual_librispeech/README.md
+++ b/datasets/multilingual_librispeech/README.md
@@ -24,7 +24,9 @@ source_datasets:
 - original
 task_categories:
 - automatic-speech-recognition
-task_ids: []
+- audio-classification
+task_ids:
+- audio-speaker-identification
 ---
 
 # Dataset Card for MultiLingual LibriSpeech
@@ -66,7 +68,7 @@ Multilingual LibriSpeech (MLS) dataset is a large multilingual corpus suitable f
 
 ### Supported Tasks and Leaderboards
 
-- `automatic-speech-recognition`, `speaker-identification`: The dataset can be used to train a model for Automatic Speech Recognition (ASR). The model is presented with an audio file and asked to transcribe the audio file to written text. The most common evaluation metric is the word error rate (WER). The task has an active leaderboard which can be found at https://paperswithcode.com/dataset/multilingual-librispeech and ranks models based on their WER.
+- `automatic-speech-recognition`, `audio-speaker-identification`: The dataset can be used to train a model for Automatic Speech Recognition (ASR). The model is presented with an audio file and asked to transcribe the audio file to written text. The most common evaluation metric is the word error rate (WER). The task has an active leaderboard which can be found at https://paperswithcode.com/dataset/multilingual-librispeech and ranks models based on their WER.
 
 ### Languages
 
diff --git a/datasets/wmt20_mlqe_task2/README.md b/datasets/wmt20_mlqe_task2/README.md
index c1890965bb0..6ab246d4b64 100644
--- a/datasets/wmt20_mlqe_task2/README.md
+++ b/datasets/wmt20_mlqe_task2/README.md
@@ -22,13 +22,16 @@ source_datasets:
 - extended|wikipedia
 task_categories:
 - translation
-task_ids: []
+- text-classification
+task_ids:
+- text-classification-other-translation-quality-estimation
 paperswithcode_id: null
 ---
 
-# Dataset Card Creation Guide
+# Dataset Card for WMT20 - MultiLingual Quality Estimation (MLQE) Task2
 
 ## Table of Contents
+
 - [Dataset Description](#dataset-description)
   - [Dataset Summary](#dataset-summary)
   - [Supported Tasks and Leaderboards](#supported-tasks-and-leaderboards)

From fe3e79e550e4b1057d249da3fc59a5f34835d772 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Fri, 8 Apr 2022 19:51:05 +0200
Subject: [PATCH 08/10] allow certain tag fields to be empty

---
 src/datasets/utils/metadata.py | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/src/datasets/utils/metadata.py b/src/datasets/utils/metadata.py
index 23f41b93e02..2b75cc7be7a 100644
--- a/src/datasets/utils/metadata.py
+++ b/src/datasets/utils/metadata.py
@@ -146,7 +146,14 @@ def validate_type(value: Any, expected_type: Type):
                         error_string += "\nOR\n" + "(" + temp_error_string + ")"
 
         else:
-            # Assuming `List`/`Dict`/`Tuple`
+            # Assuming `List`/`Dict`/`Tuple`; only `EmptyList` is allowed to be empty
+            if expected_type == EmptyList:
+                if len(value) == 0:
+                    return ""
+                else:
+                    return f"Expected `{expected_type_origin}` of length 0. Found value of type: `{type(value)}`, with length: {len(value)}.\n"
+
+            # Assuming non empty
             if not isinstance(value, expected_type_origin) or len(value) == 0:
                 return f"Expected `{expected_type_origin}` with length > 0. Found value of type: `{type(value)}`, with length: {len(value)}.\n"
 
@@ -185,18 +192,25 @@ def validate_metadata_type(metadata_dict: dict):
         raise TypeError(f"The following typing errors are found: {typing_errors}")
 
 
+class _nothing:
+    pass
+
+
+EmptyList = List[_nothing]
+
+
 @dataclass
 class DatasetMetadata:
     annotations_creators: Union[List[str], Dict[str, List[str]]]
-    language_creators: Union[List[str], Dict[str, List[str]]]
-    languages: Union[List[str], Dict[str, List[str]]]
+    language_creators: Union[EmptyList, List[str], Dict[str, List[str]]]
+    languages: Union[EmptyList, List[str], Dict[str, List[str]]]
     licenses: Union[List[str], Dict[str, List[str]]]
     multilinguality: Union[List[str], Dict[str, List[str]]]
     pretty_name: Union[str, Dict[str, str]]
     size_categories: Union[List[str], Dict[str, List[str]]]
     source_datasets: Union[List[str], Dict[str, List[str]]]
     task_categories: Union[List[str], Dict[str, List[str]]]
-    task_ids: Union[List[str], Dict[str, List[str]]]
+    task_ids: Union[EmptyList, List[str], Dict[str, List[str]]]
     paperswithcode_id: Optional[str] = None
 
     def validate(self):

From b82199c466604da06182b3d1850f58b3ac6413ea Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Mon, 11 Apr 2022 17:19:27 +0200
Subject: [PATCH 09/10] update vision datasets tags

---
 datasets/beans/README.md         | 2 +-
 datasets/cats_vs_dogs/README.md  | 2 +-
 datasets/cifar10/README.md       | 3 +--
 datasets/cifar100/README.md      | 5 ++---
 datasets/fashion_mnist/README.md | 2 +-
 datasets/food101/README.md       | 2 +-
 datasets/mnist/README.md         | 2 +-
 datasets/red_caps/README.md      | 2 --
 datasets/svhn/README.md          | 2 +-
 9 files changed, 9 insertions(+), 13 deletions(-)

diff --git a/datasets/beans/README.md b/datasets/beans/README.md
index 1b37467e350..971629f70dc 100644
--- a/datasets/beans/README.md
+++ b/datasets/beans/README.md
@@ -17,7 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- single-label-image-classification
+- image-classification-other-leaves-classification
 ---
 
 # Dataset Card for Beans
diff --git a/datasets/cats_vs_dogs/README.md b/datasets/cats_vs_dogs/README.md
index 11b65fb82ec..8543e6ff741 100644
--- a/datasets/cats_vs_dogs/README.md
+++ b/datasets/cats_vs_dogs/README.md
@@ -17,7 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- single-label-image-classification
+- image-classification-other-animals-classification
 ---
 
 # Dataset Card for Cats Vs. Dogs
diff --git a/datasets/cifar10/README.md b/datasets/cifar10/README.md
index 7edba5e9240..ce97aaa0cba 100644
--- a/datasets/cifar10/README.md
+++ b/datasets/cifar10/README.md
@@ -16,8 +16,7 @@ source_datasets:
 - extended|other-80-Million-Tiny-Images
 task_categories:
 - image-classification
-task_ids:
-- single-label-image-classification
+task_ids: []
 paperswithcode_id: cifar-10
 ---
 
diff --git a/datasets/cifar100/README.md b/datasets/cifar100/README.md
index bba8b31292e..3ab94875a23 100644
--- a/datasets/cifar100/README.md
+++ b/datasets/cifar100/README.md
@@ -16,12 +16,11 @@ source_datasets:
 - extended|other-80-Million-Tiny-Images
 task_categories:
 - image-classification
-task_ids:
-- single-label-image-classification
+task_ids: []
 paperswithcode_id: cifar-100
 ---
  
-# Dataset Card for CIFAR-10
+# Dataset Card for CIFAR-100
 
 ## Table of Contents
 - [Dataset Description](#dataset-description)
diff --git a/datasets/fashion_mnist/README.md b/datasets/fashion_mnist/README.md
index 34c84628057..75799471ecd 100644
--- a/datasets/fashion_mnist/README.md
+++ b/datasets/fashion_mnist/README.md
@@ -16,7 +16,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- single-label-image-classification
+- image-classification-other-clothing-classification
 paperswithcode_id: fashion-mnist
 pretty_name: FashionMNIST
 ---
diff --git a/datasets/food101/README.md b/datasets/food101/README.md
index 6b45228ce9d..2d6fb763b83 100644
--- a/datasets/food101/README.md
+++ b/datasets/food101/README.md
@@ -17,7 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- single-label-image-classification
+- image-classification-other-food-classification
 paperswithcode_id: food-101
 ---
 
diff --git a/datasets/mnist/README.md b/datasets/mnist/README.md
index 997f57522c4..21051419736 100644
--- a/datasets/mnist/README.md
+++ b/datasets/mnist/README.md
@@ -16,7 +16,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- single-label-image-classification
+- image-classification-other-digits-classification
 paperswithcode_id: mnist
 pretty_name: MNIST
 ---
diff --git a/datasets/red_caps/README.md b/datasets/red_caps/README.md
index a7b021eb567..9624d208e3d 100644
--- a/datasets/red_caps/README.md
+++ b/datasets/red_caps/README.md
@@ -15,10 +15,8 @@ source_datasets:
 - original
 task_categories:
 - image-to-text
-- image-classification
 task_ids:
 - image-captioning
-- single-label-image-classification
 paperswithcode_id: redcaps
 pretty_name: RedCaps
 ---
diff --git a/datasets/svhn/README.md b/datasets/svhn/README.md
index 2bfed37544a..4826a0f9450 100644
--- a/datasets/svhn/README.md
+++ b/datasets/svhn/README.md
@@ -18,7 +18,7 @@ task_categories:
 - image-classification
 - object-detection
 task_ids:
-- single-label-image-classification
+- object-detection-other-digit-detection
 paperswithcode_id: svhn
 pretty_name: Street View House Numbers
 ---

From 496b33c631b004fff3fdbfe5f0749d9be738f326 Mon Sep 17 00:00:00 2001
From: Quentin Lhoest <lhoest.q@gmail.com>
Date: Wed, 13 Apr 2022 16:53:01 +0200
Subject: [PATCH 10/10] use multi-class-image-classification and remove other
 tags

---
 datasets/beans/README.md         | 2 +-
 datasets/cats_vs_dogs/README.md  | 3 +--
 datasets/fashion_mnist/README.md | 2 +-
 datasets/food101/README.md       | 2 +-
 datasets/mnist/README.md         | 2 +-
 datasets/svhn/README.md          | 3 +--
 6 files changed, 6 insertions(+), 8 deletions(-)

diff --git a/datasets/beans/README.md b/datasets/beans/README.md
index 971629f70dc..317827a551a 100644
--- a/datasets/beans/README.md
+++ b/datasets/beans/README.md
@@ -17,7 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- image-classification-other-leaves-classification
+- multi-class-image-classification
 ---
 
 # Dataset Card for Beans
diff --git a/datasets/cats_vs_dogs/README.md b/datasets/cats_vs_dogs/README.md
index 8543e6ff741..28b278ca734 100644
--- a/datasets/cats_vs_dogs/README.md
+++ b/datasets/cats_vs_dogs/README.md
@@ -16,8 +16,7 @@ source_datasets:
 - original
 task_categories:
 - image-classification
-task_ids:
-- image-classification-other-animals-classification
+task_ids: []
 ---
 
 # Dataset Card for Cats Vs. Dogs
diff --git a/datasets/fashion_mnist/README.md b/datasets/fashion_mnist/README.md
index 75799471ecd..266e08d1369 100644
--- a/datasets/fashion_mnist/README.md
+++ b/datasets/fashion_mnist/README.md
@@ -16,7 +16,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- image-classification-other-clothing-classification
+- multi-class-image-classification
 paperswithcode_id: fashion-mnist
 pretty_name: FashionMNIST
 ---
diff --git a/datasets/food101/README.md b/datasets/food101/README.md
index 2d6fb763b83..fa0f9ff0741 100644
--- a/datasets/food101/README.md
+++ b/datasets/food101/README.md
@@ -17,7 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- image-classification-other-food-classification
+- multi-class-image-classification
 paperswithcode_id: food-101
 ---
 
diff --git a/datasets/mnist/README.md b/datasets/mnist/README.md
index 21051419736..302e2b87fb9 100644
--- a/datasets/mnist/README.md
+++ b/datasets/mnist/README.md
@@ -16,7 +16,7 @@ source_datasets:
 task_categories:
 - image-classification
 task_ids:
-- image-classification-other-digits-classification
+- multi-class-image-classification
 paperswithcode_id: mnist
 pretty_name: MNIST
 ---
diff --git a/datasets/svhn/README.md b/datasets/svhn/README.md
index 4826a0f9450..e174b55fe2a 100644
--- a/datasets/svhn/README.md
+++ b/datasets/svhn/README.md
@@ -17,8 +17,7 @@ source_datasets:
 task_categories:
 - image-classification
 - object-detection
-task_ids:
-- object-detection-other-digit-detection
+task_ids: []
 paperswithcode_id: svhn
 pretty_name: Street View House Numbers
 ---