# opus-2020-07-26.yml — 180 lines (180 loc), 4.52 KB
# (line-number gutter 1-180 from the web code viewer omitted; not part of the file)
# Release metadata for this model package.
# Archive path; the date embedded in the file name matches release-date below.
release: eng-gem/opus-2020-07-26.zip
# NOTE(review): unquoted ISO date. YAML 1.1 loaders (e.g. PyYAML) resolve this
# to a date object rather than a string; confirm what consumers expect before
# quoting it.
release-date: 2020-07-26
dataset-name: opus
modeltype: transformer
# Both parenthesised entries are spm32k, the same value given for source and
# target under `subwords` (presumably listed as source,target; confirm).
pre-processing: normalization + SentencePiece (spm32k,spm32k)
# Subword scheme label for each side of the pair.
# The children must be indented: at column 0 `subwords` parses as null and
# `source`/`target` become top-level keys that clash with other mappings.
subwords:
  source: spm32k
  target: spm32k
# Subword model file name for each side of the pair
# (presumably relative to the release archive; confirm).
# The children must be indented: at column 0 `subword-models` parses as null
# and `source`/`target` become top-level keys that clash with other mappings.
subword-models:
  source: source.spm
  target: target.spm
# Source-side language codes (single entry).
source-languages:
  - eng
# Target-side language codes (25 entries, alphabetical).
target-languages:
  - afr
  - ang
  - dan
  - deu
  - enm
  - fao
  - frr
  - fry
  - gos
  - got
  - gsw
  - isl
  - ksh
  - ltz
  - nds
  - nld
  - nno
  - nob
  - non
  - pdc
  - sco
  - stq
  - swe
  - swg
  - yid
# Target-label tokens, written as >>code<< with an optional _Script suffix
# (26 entries). Each is quoted because a plain scalar may not start with `>`.
# NOTE(review): `nob` appears both plain and as nob_Hebr; verify the latter
# against the upstream release.
use-target-labels:
  - '>>afr<<'
  - '>>ang_Latn<<'
  - '>>dan<<'
  - '>>deu<<'
  - '>>enm_Latn<<'
  - '>>fao<<'
  - '>>frr<<'
  - '>>fry<<'
  - '>>gos<<'
  - '>>got_Goth<<'
  - '>>gsw<<'
  - '>>isl<<'
  - '>>ksh<<'
  - '>>ltz<<'
  - '>>nds<<'
  - '>>nld<<'
  - '>>nno<<'
  - '>>nob<<'
  - '>>nob_Hebr<<'
  - '>>non_Latn<<'
  - '>>pdc<<'
  - '>>sco<<'
  - '>>stq<<'
  - '>>swe<<'
  - '>>swg<<'
  - '>>yid<<'
# Size of each test set as two slash-separated counts
# (presumably sentences/words; TODO confirm). Values are plain strings.
# Entries must stay nested under `test-data`: at column 0 they become
# top-level keys that duplicate the keys of the score mappings.
test-data:
  Tatoeba-test.eng-afr: 1374/8813
  Tatoeba-test.eng-ang: 189/1596
  Tatoeba-test.eng-dan: 10000/61469
  Tatoeba-test.eng-deu: 10000/69441
  Tatoeba-test.eng-enm: 49/243
  Tatoeba-test.eng-fao: 294/1564
  Tatoeba-test.eng-frr: 2/7
  Tatoeba-test.eng-fry: 205/1265
  Tatoeba-test.eng-gos: 1152/4241
  Tatoeba-test.eng-got: 207/685
  Tatoeba-test.eng-gsw: 205/761
  Tatoeba-test.eng-isl: 2500/16288
  Tatoeba-test.eng-ksh: 26/170
  Tatoeba-test.eng-ltz: 283/1351
  Tatoeba-test.eng-multi: 10000/61404
  Tatoeba-test.eng-nds: 2500/15228
  Tatoeba-test.eng-nld: 10000/60278
  Tatoeba-test.eng-non: 15/109
  Tatoeba-test.eng-nor: 5000/33820
  Tatoeba-test.eng-pdc: 53/281
  Tatoeba-test.eng-sco: 27/185
  Tatoeba-test.eng-stq: 5/26
  Tatoeba-test.eng-swe: 10000/54832
  Tatoeba-test.eng-swg: 33/195
  Tatoeba-test.eng-yid: 1168/6754
  news-test2008.eng-deu: 2051/41182
  newssyscomb2009.eng-deu: 502/9802
  newstest2009.eng-deu: 2525/54214
  newstest2010.eng-deu: 2489/53161
  newstest2011.eng-deu: 3003/62546
  newstest2012.eng-deu: 3003/62513
  newstest2013.eng-deu: 3000/54690
  newstest2015-ende.eng-deu: 2169/38160
  newstest2016-ende.eng-deu: 2999/53944
  newstest2017-ende.eng-deu: 3004/52833
  newstest2018-ende.eng-deu: 2998/54933
  newstest2019-ende.eng-deu: 1997/42087
# BLEU score per test set; the keys are the same test-set names used under
# `test-data`.
# Entries must stay nested under `BLEU-scores`: at column 0 they become
# top-level keys that duplicate those of the other per-test-set mappings.
BLEU-scores:
  Tatoeba-test.eng-afr: 56.1
  Tatoeba-test.eng-ang: 6.3
  Tatoeba-test.eng-dan: 57.2
  Tatoeba-test.eng-deu: 39.9
  Tatoeba-test.eng-enm: 1.3
  Tatoeba-test.eng-fao: 9.4
  Tatoeba-test.eng-frr: 3.6
  Tatoeba-test.eng-fry: 16.6
  Tatoeba-test.eng-gos: 2.2
  Tatoeba-test.eng-got: 0.3
  Tatoeba-test.eng-gsw: 0.9
  Tatoeba-test.eng-isl: 23.0
  Tatoeba-test.eng-ksh: 0.8
  Tatoeba-test.eng-ltz: 20.8
  Tatoeba-test.eng-multi: 46.0
  Tatoeba-test.eng-nds: 19.1
  Tatoeba-test.eng-nld: 52.7
  Tatoeba-test.eng-non: 0.6
  Tatoeba-test.eng-nor: 49.5
  Tatoeba-test.eng-pdc: 4.0
  Tatoeba-test.eng-sco: 29.8
  Tatoeba-test.eng-stq: 2.8
  Tatoeba-test.eng-swe: 57.5
  Tatoeba-test.eng-swg: 0.8
  Tatoeba-test.eng-yid: 6.3
  news-test2008.eng-deu: 20.5
  newssyscomb2009.eng-deu: 20.3
  newstest2009.eng-deu: 20.1
  newstest2010.eng-deu: 22.2
  newstest2011.eng-deu: 20.0
  newstest2012.eng-deu: 20.4
  newstest2013.eng-deu: 23.9
  newstest2015-ende.eng-deu: 27.5
  newstest2016-ende.eng-deu: 32.3
  newstest2017-ende.eng-deu: 26.0
  newstest2018-ende.eng-deu: 38.7
  newstest2019-ende.eng-deu: 34.4
# chr-F score per test set; the keys are the same test-set names used under
# `test-data`. All values here lie between 0 and 1.
# Entries must stay nested under `chr-F-scores`: at column 0 they become
# top-level keys that duplicate those of the other per-test-set mappings.
chr-F-scores:
  Tatoeba-test.eng-afr: 0.739
  Tatoeba-test.eng-ang: 0.152
  Tatoeba-test.eng-dan: 0.722
  Tatoeba-test.eng-deu: 0.612
  Tatoeba-test.eng-enm: 0.219
  Tatoeba-test.eng-fao: 0.318
  Tatoeba-test.eng-frr: 0.124
  Tatoeba-test.eng-fry: 0.419
  Tatoeba-test.eng-gos: 0.182
  Tatoeba-test.eng-got: 0.012
  Tatoeba-test.eng-gsw: 0.134
  Tatoeba-test.eng-isl: 0.504
  Tatoeba-test.eng-ksh: 0.143
  Tatoeba-test.eng-ltz: 0.392
  Tatoeba-test.eng-multi: 0.636
  Tatoeba-test.eng-nds: 0.441
  Tatoeba-test.eng-nld: 0.697
  Tatoeba-test.eng-non: 0.171
  Tatoeba-test.eng-nor: 0.671
  Tatoeba-test.eng-pdc: 0.165
  Tatoeba-test.eng-sco: 0.520
  Tatoeba-test.eng-stq: 0.327
  Tatoeba-test.eng-swe: 0.715
  Tatoeba-test.eng-swg: 0.153
  Tatoeba-test.eng-yid: 0.293
  news-test2008.eng-deu: 0.506
  newssyscomb2009.eng-deu: 0.517
  newstest2009.eng-deu: 0.512
  newstest2010.eng-deu: 0.523
  newstest2011.eng-deu: 0.504
  newstest2012.eng-deu: 0.503
  newstest2013.eng-deu: 0.529
  newstest2015-ende.eng-deu: 0.565
  newstest2016-ende.eng-deu: 0.601
  newstest2017-ende.eng-deu: 0.555
  newstest2018-ende.eng-deu: 0.642
  newstest2019-ende.eng-deu: 0.608