forked from Helsinki-NLP/Tatoeba-Challenge
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathopus-2020-07-04.yml
128 lines (128 loc) · 3.32 KB
/
opus-2020-07-04.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
# Release metadata for one packaged translation model.
# `release` is the archive path; its file name is built from the
# `dataset-name` and `release-date` values below (opus + 2020-07-04).
# presumably `iir` is the ISO 639-5 group code for Indo-Iranian languages
# and `eng` the target side — TODO confirm against the naming convention.
release: iir-eng/opus-2020-07-04.zip
# NOTE(review): unquoted ISO date. YAML 1.1 loaders (e.g. PyYAML) resolve
# this to a date object rather than a string; quote it if consumers expect
# text — confirm before changing.
release-date: 2020-07-04
dataset-name: opus
# presumably the model architecture identifier — verify against the trainer.
modeltype: transformer
# Free-text description of the pre-processing pipeline. The two names in
# parentheses match the source/target values listed under `subwords`.
pre-processing: normalization + SentencePiece (spm32k,spm32k)
# Subword segmentation scheme for each side of the model.
# Shape: a sequence of single-key mappings (one item for `source`, one for
# `target`), not one mapping with two keys — consumers must index the list.
# `spm` refers to SentencePiece (see `pre-processing`); presumably `32k` is
# the vocabulary size — TODO confirm.
subwords:
- source: spm32k
- target: spm32k
# File names of the subword models for the source and target side.
# Same sequence-of-single-key-mappings shape as `subwords`.
# presumably relative to the root of the release archive — verify.
subword-models:
- source: source.spm
- target: target.spm
# Source-side language codes covered by this model: 27 three-letter codes,
# listed in alphabetical order.
# NOTE(review): `gom`, `npi`, `pes` and `pnb` have no test set under the
# same code; `test-data` lists `kok`, `nep`, `fas` and `lah` instead.
# presumably the test sets are labelled with the ISO 639-3 macrolanguage
# code of these individual languages — confirm before joining on the code.
source-languages:
- asm
- awa
- ben
- bho
- gom
- guj
- hif
- hin
- jdt
- kur
- mai
- mar
- npi
- ori
- oss
- pan
- pes
- pnb
- pus
- rom
- san
- sin
- snd
- tgk
- tly
- urd
- zza
# Target-side language codes; this release has a single target, `eng`.
# Kept as a one-item sequence, mirroring the shape of `source-languages`.
target-languages:
- eng
# Size of each evaluation set: a sequence of single-key mappings keyed by
# `Tatoeba-test.<source>-eng`. 28 entries: one per language code plus
# `multi`. The same keys, in the same order, are used in `BLEU-scores` and
# `chr-F-scores`.
# Each value has the form `A/B`; because of the `/` it loads as a string,
# not a number.
# presumably A is the sentence count and B the word/token count — TODO
# confirm the units with the generating script.
# presumably `multi` is the combined multi-source test set — verify.
test-data:
- Tatoeba-test.asm-eng: 117/573
- Tatoeba-test.awa-eng: 279/1042
- Tatoeba-test.ben-eng: 2500/11321
- Tatoeba-test.bho-eng: 42/229
- Tatoeba-test.fas-eng: 3768/26936
- Tatoeba-test.guj-eng: 154/767
- Tatoeba-test.hif-eng: 36/187
- Tatoeba-test.hin-eng: 5000/28315
- Tatoeba-test.jdt-eng: 2/6
- Tatoeba-test.kok-eng: 1/6
- Tatoeba-test.kur-eng: 296/1404
- Tatoeba-test.lah-eng: 32/162
- Tatoeba-test.mai-eng: 8/17
- Tatoeba-test.mar-eng: 10000/53713
- Tatoeba-test.multi-eng: 10000/55828
- Tatoeba-test.nep-eng: 115/389
- Tatoeba-test.ori-eng: 33/198
- Tatoeba-test.oss-eng: 57/312
- Tatoeba-test.pan-eng: 87/514
- Tatoeba-test.pus-eng: 31/239
- Tatoeba-test.rom-eng: 671/3765
- Tatoeba-test.san-eng: 144/504
- Tatoeba-test.sin-eng: 45/210
- Tatoeba-test.snd-eng: 4/15
- Tatoeba-test.tgk-eng: 29/176
- Tatoeba-test.tly-eng: 46/167
- Tatoeba-test.urd-eng: 1663/10180
- Tatoeba-test.zza-eng: 523/2522
# BLEU score per test set: a sequence of single-key mappings using the same
# keys, in the same order, as `test-data`.
# Values are unquoted and load as floats, written with one decimal place.
# presumably on the 0-100 scale (the largest value here is 38.8) — confirm.
# NOTE(review): several sets are very small according to `test-data`
# (e.g. jdt-eng 2/6, kok-eng 1/6, snd-eng 4/15), so their scores rest on a
# handful of items.
BLEU-scores:
- Tatoeba-test.asm-eng: 10.4
- Tatoeba-test.awa-eng: 5.3
- Tatoeba-test.ben-eng: 38.7
- Tatoeba-test.bho-eng: 24.4
- Tatoeba-test.fas-eng: 5.0
- Tatoeba-test.guj-eng: 14.3
- Tatoeba-test.hif-eng: 1.2
- Tatoeba-test.hin-eng: 33.5
- Tatoeba-test.jdt-eng: 9.6
- Tatoeba-test.kok-eng: 3.4
- Tatoeba-test.kur-eng: 2.9
- Tatoeba-test.lah-eng: 18.3
- Tatoeba-test.mai-eng: 38.8
- Tatoeba-test.mar-eng: 19.5
- Tatoeba-test.multi-eng: 18.9
- Tatoeba-test.nep-eng: 2.1
- Tatoeba-test.ori-eng: 2.8
- Tatoeba-test.oss-eng: 1.5
- Tatoeba-test.pan-eng: 11.8
- Tatoeba-test.pus-eng: 1.5
- Tatoeba-test.rom-eng: 2.5
- Tatoeba-test.san-eng: 2.4
- Tatoeba-test.sin-eng: 26.3
- Tatoeba-test.snd-eng: 10.5
- Tatoeba-test.tgk-eng: 7.3
- Tatoeba-test.tly-eng: 0.8
- Tatoeba-test.urd-eng: 21.1
- Tatoeba-test.zza-eng: 0.8
# chr-F score per test set: a sequence of single-key mappings using the
# same keys, in the same order, as `test-data` and `BLEU-scores`.
# Values are unquoted floats written with three decimals; all values here
# lie between 0 and 1.
# NOTE(review): trailing zeros are not preserved by a YAML parse/dump round
# trip (`0.080` loads as 0.08, `0.400` as 0.4), so do not rely on the
# textual width of these numbers.
chr-F-scores:
- Tatoeba-test.asm-eng: 0.308
- Tatoeba-test.awa-eng: 0.229
- Tatoeba-test.ben-eng: 0.542
- Tatoeba-test.bho-eng: 0.431
- Tatoeba-test.fas-eng: 0.251
- Tatoeba-test.guj-eng: 0.331
- Tatoeba-test.hif-eng: 0.212
- Tatoeba-test.hin-eng: 0.516
- Tatoeba-test.jdt-eng: 0.080
- Tatoeba-test.kok-eng: 0.230
- Tatoeba-test.kur-eng: 0.145
- Tatoeba-test.lah-eng: 0.315
- Tatoeba-test.mai-eng: 0.598
- Tatoeba-test.mar-eng: 0.435
- Tatoeba-test.multi-eng: 0.400
- Tatoeba-test.nep-eng: 0.166
- Tatoeba-test.ori-eng: 0.193
- Tatoeba-test.oss-eng: 0.182
- Tatoeba-test.pan-eng: 0.320
- Tatoeba-test.pus-eng: 0.203
- Tatoeba-test.rom-eng: 0.179
- Tatoeba-test.san-eng: 0.168
- Tatoeba-test.sin-eng: 0.485
- Tatoeba-test.snd-eng: 0.302
- Tatoeba-test.tgk-eng: 0.280
- Tatoeba-test.tly-eng: 0.085
- Tatoeba-test.urd-eng: 0.409
- Tatoeba-test.zza-eng: 0.102