forked from Helsinki-NLP/Tatoeba-Challenge
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathopus-2020-07-27.yml
50 lines (50 loc) · 1.18 KB
/
opus-2020-07-27.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
# Release identification: archive path, release date, dataset name,
# model type and the pre-processing that was applied.
release: inc-inc/opus-2020-07-27.zip
# NOTE(review): unquoted ISO date; YAML 1.1 loaders resolve it to a date
# object rather than a string - confirm that is what consumers expect.
release-date: 2020-07-27
dataset-name: opus
modeltype: transformer
pre-processing: normalization + SentencePiece (spm32k,spm32k)
# Subword setup per side. Note the shape: each key holds a sequence of
# single-key mappings (one for source, one for target), not one mapping.
subwords:
- source: spm32k
- target: spm32k
# Subword model per side (values look like file names - TODO confirm where
# they are resolved relative to).
subword-models:
- source: source.spm
- target: target.spm
# Languages on the source side and on the target side. Both lists contain
# the same four codes (asm, hin, mar, urd).
source-languages:
- asm
- hin
- mar
- urd
target-languages:
- asm
- hin
- mar
- urd
# Target-language label tokens, one per entry in target-languages
# (presumably prepended to the input to select the output language -
# confirm with the consumer).
# Every label is quoted: a plain scalar must not begin with '>', which YAML
# reads as the folded block-scalar indicator, so the unquoted form fails to
# parse.
use-target-labels:
- '>>asm<<'
- '>>hin<<'
- '>>mar<<'
- '>>urd<<'
# Test sets, keyed by name. Each value is a pair of counts written "N/M"
# (NOTE(review): presumably sentences/words - confirm against the generator).
# YAML loads these values as plain strings, not numbers.
test-data:
- Tatoeba-test.asm-hin: 4/15
- Tatoeba-test.hin-asm: 4/13
- Tatoeba-test.hin-mar: 158/692
- Tatoeba-test.hin-urd: 239/1591
- Tatoeba-test.mar-hin: 158/860
- Tatoeba-test.multi-multi: 802/4683
- Tatoeba-test.urd-hin: 239/1512
# BLEU score per test set; the keys match those listed under test-data.
BLEU-scores:
- Tatoeba-test.asm-hin: 2.6
- Tatoeba-test.hin-asm: 9.1
- Tatoeba-test.hin-mar: 28.1
- Tatoeba-test.hin-urd: 19.9
- Tatoeba-test.mar-hin: 11.6
- Tatoeba-test.multi-multi: 17.1
- Tatoeba-test.urd-hin: 13.5
# chr-F score per test set; the keys match those listed under test-data.
chr-F-scores:
- Tatoeba-test.asm-hin: 0.231
- Tatoeba-test.hin-asm: 0.262
- Tatoeba-test.hin-mar: 0.548
- Tatoeba-test.hin-urd: 0.508
- Tatoeba-test.mar-hin: 0.466
- Tatoeba-test.multi-multi: 0.464
- Tatoeba-test.urd-hin: 0.377