diff --git a/hfutils/utils/irregular_repo.json b/hfutils/utils/irregular_repo.json index 7378355758..f2e3cb79e2 100644 --- a/hfutils/utils/irregular_repo.json +++ b/hfutils/utils/irregular_repo.json @@ -2,6 +2,7 @@ "datasets": [ "acronym_identification", "ade_corpus_v2", + "adv_glue", "aeslc", "afrikaans_ner_corpus", "ag_news", @@ -42,10 +43,12 @@ "best2009", "bible_para", "big_patent", + "bigbench", "billsum", "bing_coronavirus_query_set", "biomrc", "biosses", + "biwi_kinect_head_pose", "blended_skill_talk", "blog_authorship_corpus", "bn_hate_speech", @@ -105,9 +108,12 @@ "common_voice", "compguesswhat", "conceptnet5", + "conceptual_12m", + "conceptual_captions", "conll2000", "conll2002", "conll2003", + "conll2012_ontonotesv5", "conllpp", "consumer-finance-complaints", "conv_ai", @@ -163,15 +169,18 @@ "electricity_load_diagrams", "eli5", "eli5_category", + "elkarhizketak", "emea", "emo", "emotone_ar", "empathetic_dialogues", "enriched_web_nlg", + "enwik8", "eraser_multi_rc", "esnli", "eth_py150_open", "ethos", + "ett", "eu_regulatory_ir", "eurlex", "euronews", @@ -209,6 +218,7 @@ "google_wellformed_query", "grail_qa", "great_code", + "gsm8k", "guardian_authorship", "gutenberg_time", "hans", @@ -254,6 +264,8 @@ "igbo_monolingual", "igbo_ner", "ilist", + "imagenet-1k", + "imagenet_sketch", "imdb_urdu_reviews", "imppres", "indic_glue", @@ -290,6 +302,7 @@ "large_spanish_corpus", "laroseda", "lc_quad", + "lccc", "lener_br", "liar", "librispeech_asr", @@ -319,6 +332,7 @@ "medical_questions_pairs", "menyo20k_mt", "meta_woz", + "metashift", "metooma", "metrec", "miam", @@ -328,6 +342,7 @@ "mlsum", "mnist", "mocha", + "monash_tsf", "moroco", "movie_rationales", "mrqa", @@ -396,8 +411,8 @@ "para_pat", "parsinlu_reading_comprehension", "pass", - "paws-x", "paws", + "paws-x", "pec", "peoples_daily_ner", "per_sent", @@ -430,6 +445,7 @@ "quac", "quail", "quarel", + "quickdraw", "quora", "quoref", "re_dial", @@ -445,12 +461,14 @@ "ro_sts", "ro_sts_parallel", "roman_urdu", + "roman_urdu_hate_speech", "ronec", "rotten_tomatoes", "samsum", "sanskrit_classic", "saudinewsnet", "sberquad", + "sbu_captions", "scan", "scb_mt_enth_2020", "scene_parse_150", @@ -530,6 +548,7 @@ "telugu_news", "tep_en_fa_para", "text2log", + "textvqa", "thai_toxicity_tweet", "thainer", "thaiqa_squad", @@ -543,9 +562,11 @@ "timit_asr", "tlc", "tmu_gfm_dataset", + "tne", "told-br", "totto", "trec", + "truthful_qa", "tsac", "ttc4900", "tunizi", @@ -572,6 +593,7 @@ "urdu_fake_news", "urdu_sentiment_corpus", "vctk", + "visual_genome", "vivos", "web_nlg", "web_of_science", @@ -599,6 +621,7 @@ "wikihow", "wikipedia", "wikisql", + "wikitablequestions", "wikitext", "wikitext_tl39", "wili_2018", @@ -632,30 +655,7 @@ "yoruba_text_c3", "yoruba_wordsim353", "youtube_caption_corrections", - "zest", - "elkarhizketak", - "wikitablequestions", - "conll2012_ontonotesv5", - "monash_tsf", - "roman_urdu_hate_speech", - "adv_glue", - "metashift", - "gsm8k", - "sbu_captions", - "conceptual_captions", - "conceptual_12m", - "visual_genome", - "imagenet-1k", - "tne", - "textvqa", - "ett", - "imagenet_sketch", - "biwi_kinect_head_pose", - "enwik8", - "truthful_qa", - "bigbench", - "quickdraw", - "lccc" + "zest" ], "models": [], "spaces": []