Skip to content

Commit 114c09a

Browse files
authored
Generate tasks.json taxonomy from huggingface_hub (#4154)
* Update tasks.json
* recompute export
* honor `hideInDatasets`
1 parent b9aa570 commit 114c09a

File tree

1 file changed

+51
-55
lines changed

1 file changed

+51
-55
lines changed

src/datasets/utils/resources/tasks.json

Lines changed: 51 additions & 55 deletions
Original file line number | Diff line number | Diff line change
@@ -13,10 +13,10 @@
1313
"type": "audio"
1414
},
1515
"automatic-speech-recognition": {
16-
"type": "multimodal"
16+
"type": "audio"
1717
},
1818
"conversational": {
19-
"type": "text",
19+
"type": "nlp",
2020
"subtasks": [
2121
"dialogue-generation"
2222
]
@@ -25,90 +25,96 @@
2525
"type": "multimodal"
2626
},
2727
"fill-mask": {
28-
"type": "text",
28+
"type": "nlp",
2929
"subtasks": [
3030
"slot-filling",
3131
"masked-language-modeling"
3232
]
3333
},
3434
"image-classification": {
35-
"type": "image",
35+
"type": "cv",
3636
"subtasks": [
3737
"multi-label-image-classification",
3838
"multi-class-image-classification"
3939
]
4040
},
4141
"image-segmentation": {
42-
"type": "image",
42+
"type": "cv",
4343
"subtasks": [
4444
"instance-segmentation",
4545
"semantic-segmentation",
4646
"panoptic-segmentation"
4747
]
4848
},
49+
"image-to-image": {
50+
"type": "cv"
51+
},
4952
"image-to-text": {
5053
"type": "multimodal",
5154
"subtasks": [
5255
"image-captioning"
5356
]
5457
},
5558
"multiple-choice": {
56-
"type": "text",
59+
"type": "nlp",
5760
"subtasks": [
5861
"multiple-choice-qa",
5962
"multiple-choice-coreference-resolution"
6063
]
6164
},
6265
"object-detection": {
63-
"type": "image",
66+
"type": "cv",
6467
"subtasks": [
6568
"face-detection",
6669
"vehicle-detection"
6770
]
6871
},
72+
"other": {
73+
"type": "other"
74+
},
6975
"question-answering": {
70-
"type": "text",
71-
"aliases": [
72-
"extractive-question-answering"
73-
],
76+
"type": "nlp",
7477
"subtasks": [
7578
"extractive-qa",
7679
"open-domain-qa",
7780
"closed-domain-qa"
7881
]
7982
},
8083
"sentence-similarity": {
81-
"type": "text"
84+
"type": "nlp"
85+
},
86+
"summarization": {
87+
"type": "nlp",
88+
"subtasks": [
89+
"news-articles-summarization",
90+
"news-articles-headline-generation"
91+
]
92+
},
93+
"table-question-answering": {
94+
"type": "nlp"
95+
},
96+
"table-to-text": {
97+
"type": "nlp",
98+
"subtasks": [
99+
"rdf-to-text"
100+
]
82101
},
83102
"tabular-classification": {
84-
"type": "text",
103+
"type": "structured",
85104
"subtasks": [
86105
"tabular-multi-class-classification",
87106
"tabular-multi-label-classification",
88107
"tabular-single-column-regression"
89108
]
90109
},
91110
"tabular-to-text": {
92-
"type": "text",
111+
"type": "structured",
93112
"subtasks": [
94113
"rdf-to-text"
95114
]
96115
},
97-
"summarization": {
98-
"type": "text",
99-
"subtasks": [
100-
"news-articles-summarization",
101-
"news-articles-headline-generation"
102-
]
103-
},
104-
"table-to-text": {
105-
"type": "text"
106-
},
107-
"table-question-answering": {
108-
"type": "text"
109-
},
110116
"text-classification": {
111-
"type": "text",
117+
"type": "nlp",
112118
"subtasks": [
113119
"acceptability-classification",
114120
"entity-linking-classification",
@@ -128,14 +134,14 @@
128134
]
129135
},
130136
"text-generation": {
131-
"type": "text",
137+
"type": "nlp",
132138
"subtasks": [
133139
"dialogue-modeling",
134140
"language-modeling"
135141
]
136142
},
137143
"text-retrieval": {
138-
"type": "text",
144+
"type": "nlp",
139145
"subtasks": [
140146
"document-retrieval",
141147
"utterance-retrieval",
@@ -146,18 +152,11 @@
146152
"text-to-image": {
147153
"type": "multimodal"
148154
},
149-
"text-to-tabular": {
150-
"type": "text",
151-
"subtasks": [
152-
"relation-extraction",
153-
"semantic-role-labeling"
154-
]
155-
},
156155
"text-to-speech": {
157-
"type": "multimodal"
156+
"type": "audio"
158157
},
159158
"text2text-generation": {
160-
"type": "text",
159+
"type": "nlp",
161160
"subtasks": [
162161
"text-simplification",
163162
"explanation-generation",
@@ -169,45 +168,42 @@
169168
]
170169
},
171170
"time-series-forecasting": {
172-
"type": "time series",
171+
"type": "structured",
173172
"subtasks": [
174173
"univariate-time-series-forecasting",
175174
"multivariate-time-series-forecasting"
176175
]
177176
},
178177
"token-classification": {
179-
"type": "text",
180-
"aliases": [
181-
"structure-prediction"
182-
],
178+
"type": "nlp",
183179
"subtasks": [
184180
"named-entity-recognition",
185-
"part-of-speech-tagging",
181+
"part-of-speech",
186182
"parsing",
187183
"lemmatization",
188184
"word-sense-disambiguation",
189185
"coreference-resolution"
190186
]
191187
},
192188
"translation": {
193-
"type": "text"
189+
"type": "nlp"
190+
},
191+
"unconditional-image-generation": {
192+
"type": "cv"
194193
},
195194
"visual-question-answering": {
196-
"type": "multimodal"
195+
"type": "multimodal",
196+
"subtasks": [
197+
"visual-question-answering"
198+
]
197199
},
198200
"voice-activity-detection": {
199201
"type": "audio"
200202
},
201203
"zero-shot-classification": {
202-
"type": "text"
204+
"type": "nlp"
203205
},
204206
"zero-shot-image-classification": {
205-
"type": "multimodal"
206-
},
207-
"reinforcement-learning": {
208-
"type": "other"
209-
},
210-
"other": {
211-
"type": "other"
207+
"type": "cv"
212208
}
213209
}

0 commit comments

Comments
 (0)