forked from Helsinki-NLP/Tatoeba-Challenge
-
Notifications
You must be signed in to change notification settings - Fork 0
/
opus4m-2020-08-12.yml
204 lines (204 loc) · 5.54 KB
/
opus4m-2020-08-12.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
# Top-level metadata identifying this model release.
# Presumably the archive path relative to the release root - confirm.
release: roa-eng/opus4m-2020-08-12.zip
# NOTE(review): unquoted ISO date; YAML 1.1 loaders may return a date object
# instead of a string - confirm what consumers expect before quoting.
release-date: 2020-08-12
dataset-name: opus4m
modeltype: transformer
# The parenthesised pair repeats the source/target subword settings.
pre-processing: normalization + SentencePiece (spm32k,spm32k)
# Subword segmentation used on each side of the model.
# The entries must be nested: at column 0 they load as top-level keys and
# leave `subwords` itself null.
subwords:
  source: spm32k
  target: spm32k
# File names of the subword models for each side.
# The entries must be nested: at column 0 they load as top-level `source` /
# `target` keys and leave `subword-models` itself null.
subword-models:
  source: source.spm
  target: target.spm
# Three-letter codes of the languages accepted on the source side.
source-languages:
  - arg
  - ast
  - cat
  - cos
  - egl
  - ext
  - fra
  - frm
  - gcf
  - glg
  - hat
  - ind
  - ita
  - lad
  - lij
  - lld
  - lmo
  - max
  - mfe
  - min
  - mwl
  - oci
  - pap
  - pms
  - por
  - roh
  - ron
  - scn
  - spa
  - tmw
  - vec
  - wln
  - zlm
  - zsm
# Three-letter codes of the languages produced on the target side.
target-languages:
  - eng
# Size of each evaluation set, keyed by `<test set>.<source>-<target>`.
# Values are presumably `<sentences>/<words>` - confirm against the tooling
# that writes this file.
# The entries must be nested: at column 0 they load as top-level keys and
# leave `test-data` itself null.
test-data:
  Tatoeba-test.arg-eng: 105/343
  Tatoeba-test.ast-eng: 99/682
  Tatoeba-test.cat-eng: 1631/10625
  Tatoeba-test.cos-eng: 5/28
  Tatoeba-test.egl-eng: 84/348
  Tatoeba-test.ext-eng: 69/279
  Tatoeba-test.fra-eng: 10000/65688
  Tatoeba-test.frm-eng: 18/183
  Tatoeba-test.gcf-eng: 99/455
  Tatoeba-test.glg-eng: 1008/7171
  Tatoeba-test.hat-eng: 64/281
  Tatoeba-test.ita-eng: 10000/56443
  Tatoeba-test.lad-eng: 629/2774
  Tatoeba-test.lij-eng: 94/586
  Tatoeba-test.lld-eng: 21/189
  Tatoeba-test.lmo-eng: 17/104
  Tatoeba-test.mfe-eng: 7/28
  Tatoeba-test.msa-eng: 5000/31183
  Tatoeba-test.multi-eng: 10000/63328
  Tatoeba-test.mwl-eng: 4/19
  Tatoeba-test.oci-eng: 841/4376
  Tatoeba-test.pap-eng: 70/275
  Tatoeba-test.pms-eng: 268/1708
  Tatoeba-test.por-eng: 10000/63761
  Tatoeba-test.roh-eng: 16/186
  Tatoeba-test.ron-eng: 5000/31418
  Tatoeba-test.scn-eng: 4/31
  Tatoeba-test.spa-eng: 10000/67744
  Tatoeba-test.vec-eng: 19/90
  Tatoeba-test.wln-eng: 89/363
  news-test2008.fra-eng: 2051/43455
  news-test2008.spa-eng: 2051/43455
  newsdev2016-enro.ron-eng: 1999/43535
  newsdiscussdev2015-enfr.fra-eng: 1500/24201
  newsdiscusstest2015-enfr.fra-eng: 1500/23668
  newssyscomb2009.fra-eng: 502/10424
  newssyscomb2009.ita-eng: 502/10424
  newssyscomb2009.spa-eng: 502/10424
  newstest2009.fra-eng: 2525/57625
  newstest2009.ita-eng: 2525/57625
  newstest2009.spa-eng: 2525/57625
  newstest2010.fra-eng: 2489/54021
  newstest2010.spa-eng: 2489/54021
  newstest2011.fra-eng: 3003/65829
  newstest2011.spa-eng: 3003/65829
  newstest2012.fra-eng: 3003/63778
  newstest2012.spa-eng: 3003/63778
  newstest2013.fra-eng: 3000/56089
  newstest2013.spa-eng: 3000/56089
  newstest2014-fren.fra-eng: 3003/62338
  newstest2016-enro.ron-eng: 1999/42055
# BLEU score per evaluation set, keyed by `<test set>.<source>-<target>`.
# The entries must be nested: at column 0 they load as top-level keys and
# leave `BLEU-scores` itself null.
BLEU-scores:
  Tatoeba-test.arg-eng: 44.6
  Tatoeba-test.ast-eng: 34.9
  Tatoeba-test.cat-eng: 55.1
  Tatoeba-test.cos-eng: 63.2
  Tatoeba-test.egl-eng: 5.6
  Tatoeba-test.ext-eng: 29.3
  Tatoeba-test.fra-eng: 53.9
  Tatoeba-test.frm-eng: 23.6
  Tatoeba-test.gcf-eng: 18.0
  Tatoeba-test.glg-eng: 55.4
  Tatoeba-test.hat-eng: 37.3
  Tatoeba-test.ita-eng: 65.4
  Tatoeba-test.lad-eng: 14.0
  Tatoeba-test.lij-eng: 9.2
  Tatoeba-test.lld-eng: 8.7
  Tatoeba-test.lmo-eng: 10.8
  Tatoeba-test.mfe-eng: 66.0
  Tatoeba-test.msa-eng: 41.1
  Tatoeba-test.multi-eng: 55.1
  Tatoeba-test.mwl-eng: 22.3
  Tatoeba-test.oci-eng: 21.7
  Tatoeba-test.pap-eng: 56.6
  Tatoeba-test.pms-eng: 12.9
  Tatoeba-test.por-eng: 59.8
  Tatoeba-test.roh-eng: 19.4
  Tatoeba-test.ron-eng: 55.4
  Tatoeba-test.scn-eng: 35.8
  Tatoeba-test.spa-eng: 56.4
  Tatoeba-test.vec-eng: 13.6
  Tatoeba-test.wln-eng: 13.4
  news-test2008.fra-eng: 25.3
  news-test2008.spa-eng: 26.4
  newsdev2016-enro.ron-eng: 37.2
  newsdiscussdev2015-enfr.fra-eng: 31.8
  newsdiscusstest2015-enfr.fra-eng: 36.2
  newssyscomb2009.fra-eng: 29.5
  newssyscomb2009.ita-eng: 32.1
  newssyscomb2009.spa-eng: 28.6
  newstest2009.fra-eng: 28.7
  newstest2009.ita-eng: 31.9
  newstest2009.spa-eng: 29.1
  newstest2010.fra-eng: 30.1
  newstest2010.spa-eng: 33.3
  newstest2011.fra-eng: 31.2
  newstest2011.spa-eng: 32.2
  newstest2012.fra-eng: 31.3
  newstest2012.spa-eng: 35.1
  newstest2013.fra-eng: 32.0
  newstest2013.spa-eng: 32.9
  newstest2014-fren.fra-eng: 34.6
  newstest2016-enro.ron-eng: 35.9
# chr-F score per evaluation set, keyed by `<test set>.<source>-<target>`.
# The entries must be nested: at column 0 they load as top-level keys and
# leave `chr-F-scores` itself null.
chr-F-scores:
  Tatoeba-test.arg-eng: 0.535
  Tatoeba-test.ast-eng: 0.527
  Tatoeba-test.cat-eng: 0.708
  Tatoeba-test.cos-eng: 0.651
  Tatoeba-test.egl-eng: 0.212
  Tatoeba-test.ext-eng: 0.468
  Tatoeba-test.fra-eng: 0.692
  Tatoeba-test.frm-eng: 0.405
  Tatoeba-test.gcf-eng: 0.316
  Tatoeba-test.glg-eng: 0.712
  Tatoeba-test.hat-eng: 0.553
  Tatoeba-test.ita-eng: 0.772
  Tatoeba-test.lad-eng: 0.441
  Tatoeba-test.lij-eng: 0.282
  Tatoeba-test.lld-eng: 0.267
  Tatoeba-test.lmo-eng: 0.287
  Tatoeba-test.mfe-eng: 0.805
  Tatoeba-test.msa-eng: 0.595
  Tatoeba-test.multi-eng: 0.699
  Tatoeba-test.mwl-eng: 0.393
  Tatoeba-test.oci-eng: 0.410
  Tatoeba-test.pap-eng: 0.672
  Tatoeba-test.pms-eng: 0.335
  Tatoeba-test.por-eng: 0.738
  Tatoeba-test.roh-eng: 0.429
  Tatoeba-test.ron-eng: 0.704
  Tatoeba-test.scn-eng: 0.388
  Tatoeba-test.spa-eng: 0.716
  Tatoeba-test.vec-eng: 0.343
  Tatoeba-test.wln-eng: 0.315
  news-test2008.fra-eng: 0.533
  news-test2008.spa-eng: 0.541
  newsdev2016-enro.ron-eng: 0.632
  newsdiscussdev2015-enfr.fra-eng: 0.566
  newsdiscusstest2015-enfr.fra-eng: 0.595
  newssyscomb2009.fra-eng: 0.564
  newssyscomb2009.ita-eng: 0.584
  newssyscomb2009.spa-eng: 0.560
  newstest2009.fra-eng: 0.557
  newstest2009.ita-eng: 0.581
  newstest2009.spa-eng: 0.561
  newstest2010.fra-eng: 0.575
  newstest2010.spa-eng: 0.595
  newstest2011.fra-eng: 0.585
  newstest2011.spa-eng: 0.584
  newstest2012.fra-eng: 0.579
  newstest2012.spa-eng: 0.605
  newstest2013.fra-eng: 0.576
  newstest2013.spa-eng: 0.591
  newstest2014-fren.fra-eng: 0.610
  newstest2016-enro.ron-eng: 0.614