Skip to content

Commit 46836cd

Browse files
committed
more fixes
1 parent 76d9a14 commit 46836cd

File tree

18 files changed

+537
-779
lines changed

18 files changed

+537
-779
lines changed

datasets/caner/README.md

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,8 @@ language_creators:
55
- expert-generated
66
languages:
77
- ar
8-
licenses: []
8+
licenses:
9+
- unknown
910
multilinguality:
1011
- monolingual
1112
size_categories:

datasets/chr_en/README.md

Lines changed: 21 additions & 50 deletions
Original file line number | Diff line number | Diff line change
@@ -1,67 +1,38 @@
11
---
22
annotations_creators:
3-
monolingual:
4-
- no-annotation
5-
monolingual_raw:
6-
- found
7-
parallel:
8-
- expert-generated
9-
parallel_raw:
10-
- expert-generated
3+
- expert-generated
4+
- found
5+
- no-annotation
116
language_creators:
127
- found
138
languages:
14-
monolingual:
15-
- chr
16-
- en
17-
monolingual_raw:
18-
- chr
19-
parallel:
20-
- chr
21-
- en
22-
parallel_raw:
23-
- chr
24-
- en
9+
- chr
10+
- en
2511
licenses:
2612
- other-different-license-per-source
2713
multilinguality:
28-
monolingual:
29-
- multilingual
30-
monolingual_raw:
31-
- monolingual
32-
parallel:
33-
- translation
34-
parallel_raw:
35-
- translation
14+
- monolingual
15+
- multilingual
16+
- translation
3617
size_categories:
37-
monolingual:
38-
- 100K<n<1M
39-
monolingual_raw:
40-
- 1K<n<10K
41-
parallel:
42-
- 10K<n<100K
43-
parallel_raw:
44-
- 10K<n<100K
18+
- 100K<n<1M
19+
- 10K<n<100K
20+
- 1K<n<10K
4521
source_datasets:
4622
- original
4723
task_categories:
48-
monolingual:
49-
- translation
50-
monolingual_raw:
51-
- text-generation
52-
- fill-mask
53-
parallel:
54-
- translation
55-
parallel_raw:
56-
- translation
24+
- fill-mask
25+
- text-generation
26+
- translation
5727
task_ids:
58-
monolingual: []
59-
monolingual_raw:
60-
- language-modeling
61-
- masked-language-modeling
62-
parallel: []
63-
parallel_raw: []
28+
- language-modeling
29+
- masked-language-modeling
6430
paperswithcode_id: chren
31+
configs:
32+
- monolingual
33+
- monolingual_raw
34+
- parallel
35+
- parallel_raw
6536
---
6637

6738
# Dataset Card for ChrEn

datasets/mkb/README.md

Lines changed: 48 additions & 90 deletions
Original file line number | Diff line number | Diff line change
@@ -24,100 +24,58 @@ annotations_creators:
2424
source_datasets:
2525
- original
2626
size_categories:
27-
bn-en:
28-
- 1K<n<10K
29-
bn-gu:
30-
- 1K<n<10K
31-
bn-hi:
32-
- 1K<n<10K
33-
bn-ml:
34-
- 1K<n<10K
35-
bn-mr:
36-
- 1K<n<10K
37-
bn-or:
38-
- n<1K
39-
bn-ta:
40-
- 1K<n<10K
41-
bn-te:
42-
- 1K<n<10K
43-
bn-ur:
44-
- n<1K
45-
en-gu:
46-
- 1K<n<10K
47-
en-hi:
48-
- 1K<n<10K
49-
en-ml:
50-
- 1K<n<10K
51-
en-mr:
52-
- 1K<n<10K
53-
en-or:
54-
- n<1K
55-
en-ta:
56-
- 1K<n<10K
57-
en-te:
58-
- 1K<n<10K
59-
en-ur:
60-
- 1K<n<10K
61-
gu-hi:
62-
- 1K<n<10K
63-
gu-ml:
64-
- 1K<n<10K
65-
gu-mr:
66-
- 1K<n<10K
67-
gu-or:
68-
- n<1K
69-
gu-ta:
70-
- 1K<n<10K
71-
gu-te:
72-
- 1K<n<10K
73-
gu-ur:
74-
- n<1K
75-
hi-ml:
76-
- 1K<n<10K
77-
hi-mr:
78-
- 1K<n<10K
79-
hi-or:
80-
- n<1K
81-
hi-ta:
82-
- 1K<n<10K
83-
hi-te:
84-
- 1K<n<10K
85-
hi-ur:
86-
- n<1K
87-
ml-mr:
88-
- 1K<n<10K
89-
ml-or:
90-
- n<1K
91-
ml-ta:
92-
- 1K<n<10K
93-
ml-te:
94-
- 1K<n<10K
95-
ml-ur:
96-
- n<1K
97-
mr-or:
98-
- n<1K
99-
mr-ta:
100-
- 1K<n<10K
101-
mr-te:
102-
- 1K<n<10K
103-
mr-ur:
104-
- n<1K
105-
or-ta:
106-
- n<1K
107-
or-te:
108-
- n<1K
109-
or-ur:
110-
- n<1K
111-
ta-te:
112-
- 1K<n<10K
113-
ta-ur:
114-
- n<1K
115-
te-ur:
116-
- n<1K
27+
- 1K<n<10K
28+
- n<1K
11729
licenses:
11830
- cc-by-4.0
11931
paperswithcode_id: null
12032
pretty_name: CVIT MKB
33+
configs:
34+
- bn-en
35+
- bn-gu
36+
- bn-hi
37+
- bn-ml
38+
- bn-mr
39+
- bn-or
40+
- bn-ta
41+
- bn-te
42+
- bn-ur
43+
- en-gu
44+
- en-hi
45+
- en-ml
46+
- en-mr
47+
- en-or
48+
- en-ta
49+
- en-te
50+
- en-ur
51+
- gu-hi
52+
- gu-ml
53+
- gu-mr
54+
- gu-or
55+
- gu-ta
56+
- gu-te
57+
- gu-ur
58+
- hi-ml
59+
- hi-mr
60+
- hi-or
61+
- hi-ta
62+
- hi-te
63+
- hi-ur
64+
- ml-mr
65+
- ml-or
66+
- ml-ta
67+
- ml-te
68+
- ml-ur
69+
- mr-or
70+
- mr-ta
71+
- mr-te
72+
- mr-ur
73+
- or-ta
74+
- or-te
75+
- or-ur
76+
- ta-te
77+
- ta-ur
78+
- te-ur
12179
---
12280

12381
# Dataset Card for CVIT MKB

datasets/myanmar_news/README.md

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,8 @@
11
---
2-
annotations_creators: []
3-
language_creators: []
2+
annotations_creators:
3+
- found
4+
language_creators:
5+
- found
46
languages:
57
- my
68
licenses:

datasets/norne/README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ annotations_creators:
44
language_creators:
55
- crowdsourced
66
languages:
7-
- false
7+
- "no"
88
licenses:
99
- other-national-library-of-norway
1010
multilinguality:

0 commit comments

Comments
 (0)