# opus-2020-07-14.yml
# Release identification plus model / pre-processing metadata.
release: 'eng-gem/opus-2020-07-14.zip'
# Kept as a plain scalar so its parsed type is unchanged: YAML 1.1 loaders
# resolve it to a date, not a string.
# NOTE(review): confirm which type consumers expect before quoting it.
release-date: 2020-07-14
dataset-name: 'opus'
modeltype: 'transformer'
pre-processing: 'normalization + SentencePiece (spm32k,spm32k)'
# Subword scheme for each side of the model.
# NOTE(review): nesting restored on the assumption that the flat layout lost
# its indentation. At column 0 `subwords` parsed as null and `source`/`target`
# became top-level keys duplicating the ones listed after `subword-models`.
subwords:
  source: spm32k
  target: spm32k
# Subword model file for each side of the model.
# NOTE(review): nesting restored on the assumption that the flat layout lost
# its indentation. At column 0 `subword-models` parsed as null and
# `source`/`target` became top-level keys duplicating the ones listed after
# `subwords`.
subword-models:
  source: source.spm
  target: target.spm
# Source-side language list.
source-languages:
  - eng
# Target-side language list, in alphabetical order.
target-languages:
  - afr
  - ang
  - dan
  - deu
  - enm
  - fao
  - frr
  - fry
  - gos
  - got
  - gsw
  - isl
  - ksh
  - ltz
  - nds
  - nld
  - nno
  - nob
  - non
  - pdc
  - sco
  - stq
  - swe
  - swg
  - yid
# Target label tokens. Each entry must stay quoted: a plain scalar starting
# with `>` would be read as a folded block scalar indicator.
use-target-labels:
  - '>>afr<<'
  - '>>ang_Latn<<'
  - '>>dan<<'
  - '>>deu<<'
  - '>>enm_Latn<<'
  - '>>fao<<'
  - '>>frr<<'
  - '>>fry<<'
  - '>>gos<<'
  - '>>got_Goth<<'
  - '>>gsw<<'
  - '>>isl<<'
  - '>>ksh<<'
  - '>>ltz<<'
  - '>>nds<<'
  - '>>nld<<'
  - '>>nno<<'
  - '>>nob<<'
  - '>>nob_Hebr<<'
  - '>>non_Latn<<'
  - '>>pdc<<'
  - '>>sco<<'
  - '>>stq<<'
  - '>>swe<<'
  - '>>swg<<'
  - '>>yid<<'
# Size of each test set, keyed by test-set name.
# Values are `N/M` strings — presumably sentence/token counts; TODO confirm.
# NOTE(review): nesting restored on the assumption that the flat layout lost
# its indentation. At column 0 `test-data` parsed as null and every
# `Tatoeba-test.*` key collided with the same key in the score sections.
test-data:
  Tatoeba-test.eng-afr: 1374/8813
  Tatoeba-test.eng-ang: 189/1596
  Tatoeba-test.eng-dan: 10000/61469
  Tatoeba-test.eng-deu: 10000/69441
  Tatoeba-test.eng-enm: 49/243
  Tatoeba-test.eng-fao: 294/1564
  Tatoeba-test.eng-frr: 2/7
  Tatoeba-test.eng-fry: 205/1265
  Tatoeba-test.eng-gos: 1152/4241
  Tatoeba-test.eng-got: 207/685
  Tatoeba-test.eng-gsw: 205/761
  Tatoeba-test.eng-isl: 2500/16288
  Tatoeba-test.eng-ksh: 26/170
  Tatoeba-test.eng-ltz: 283/1351
  Tatoeba-test.eng-multi: 10000/61404
  Tatoeba-test.eng-nds: 2500/15228
  Tatoeba-test.eng-nld: 10000/60278
  Tatoeba-test.eng-non: 15/109
  Tatoeba-test.eng-pdc: 53/281
  Tatoeba-test.eng-sco: 27/185
  Tatoeba-test.eng-stq: 5/26
  Tatoeba-test.eng-swe: 10000/54832
  Tatoeba-test.eng-swg: 33/195
  Tatoeba-test.eng-yid: 1168/6754
# BLEU score per test set, keyed by test-set name.
# NOTE(review): nesting restored on the assumption that the flat layout lost
# its indentation. At column 0 `BLEU-scores` parsed as null and every
# `Tatoeba-test.*` key collided with the same key in the other per-test-set
# sections, so a last-wins parser would drop these values.
BLEU-scores:
  Tatoeba-test.eng-afr: 56.3
  Tatoeba-test.eng-ang: 5.8
  Tatoeba-test.eng-dan: 56.7
  Tatoeba-test.eng-deu: 39.2
  Tatoeba-test.eng-enm: 1.4
  Tatoeba-test.eng-fao: 8.1
  Tatoeba-test.eng-frr: 6.4
  Tatoeba-test.eng-fry: 16.5
  Tatoeba-test.eng-gos: 2.5
  Tatoeba-test.eng-got: 0.3
  Tatoeba-test.eng-gsw: 0.9
  Tatoeba-test.eng-isl: 23.0
  Tatoeba-test.eng-ksh: 0.9
  Tatoeba-test.eng-ltz: 19.3
  Tatoeba-test.eng-multi: 45.6
  Tatoeba-test.eng-nds: 19.1
  Tatoeba-test.eng-nld: 52.5
  Tatoeba-test.eng-non: 0.7
  Tatoeba-test.eng-pdc: 5.9
  Tatoeba-test.eng-sco: 31.0
  Tatoeba-test.eng-stq: 5.5
  Tatoeba-test.eng-swe: 57.2
  Tatoeba-test.eng-swg: 1.1
  Tatoeba-test.eng-yid: 6.4
# chr-F score per test set, keyed by test-set name.
# NOTE(review): nesting restored on the assumption that the flat layout lost
# its indentation. At column 0 `chr-F-scores` parsed as null and every
# `Tatoeba-test.*` key collided with the same key in the other per-test-set
# sections.
chr-F-scores:
  Tatoeba-test.eng-afr: 0.742
  Tatoeba-test.eng-ang: 0.148
  Tatoeba-test.eng-dan: 0.718
  Tatoeba-test.eng-deu: 0.606
  Tatoeba-test.eng-enm: 0.211
  Tatoeba-test.eng-fao: 0.310
  Tatoeba-test.eng-frr: 0.128
  Tatoeba-test.eng-fry: 0.416
  Tatoeba-test.eng-gos: 0.195
  Tatoeba-test.eng-got: 0.012
  Tatoeba-test.eng-gsw: 0.135
  Tatoeba-test.eng-isl: 0.499
  Tatoeba-test.eng-ksh: 0.141
  Tatoeba-test.eng-ltz: 0.379
  Tatoeba-test.eng-multi: 0.633
  Tatoeba-test.eng-nds: 0.440
  Tatoeba-test.eng-nld: 0.696
  Tatoeba-test.eng-non: 0.176
  Tatoeba-test.eng-pdc: 0.177
  Tatoeba-test.eng-sco: 0.527
  Tatoeba-test.eng-stq: 0.337
  Tatoeba-test.eng-swe: 0.713
  Tatoeba-test.eng-swg: 0.159
  Tatoeba-test.eng-yid: 0.294