forked from Helsinki-NLP/Tatoeba-Challenge
-
Notifications
You must be signed in to change notification settings - Fork 0
/
opus-2020-08-12.yml
36 lines (36 loc) · 870 Bytes
/
opus-2020-08-12.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# Release metadata for the mkh-eng model package.
release: mkh-eng/opus-2020-08-12.zip
# NOTE(review): unquoted ISO date; YAML 1.1 loaders resolve this to a date
# object rather than a string. Left unquoted so the parsed type is unchanged;
# quote it if consumers expect a string.
release-date: 2020-08-12
dataset-name: opus
modeltype: transformer
pre-processing: normalization + SentencePiece (spm32k,spm32k)

# Subword segmentation per side. Entries are nested under their parent key so
# that `source`/`target` here do not collide with those in `subword-models`.
subwords:
  source: spm32k
  target: spm32k

# Subword model files per side.
subword-models:
  source: source.spm
  target: target.spm

source-languages:
  - kha
  - khm
  - mnw
  - vie

target-languages:
  - eng

# Per-test-set sizes, keyed by test-set name.
# NOTE(review): values look like "<sentences>/<words>" -- confirm against the
# tool that generates this file.
test-data:
  Tatoeba-test.kha-eng: 1314/6985
  Tatoeba-test.khm-eng: 752/3505
  Tatoeba-test.mnw-eng: 9/67
  Tatoeba-test.multi-eng: 4579/28701
  Tatoeba-test.vie-eng: 2500/17313

# BLEU score per test set (same keys as `test-data`).
BLEU-scores:
  Tatoeba-test.kha-eng: 0.5
  Tatoeba-test.khm-eng: 8.5
  Tatoeba-test.mnw-eng: 0.7
  Tatoeba-test.multi-eng: 24.5
  Tatoeba-test.vie-eng: 34.4

# chr-F score per test set (same keys as `test-data`).
chr-F-scores:
  Tatoeba-test.kha-eng: 0.108
  Tatoeba-test.khm-eng: 0.206
  Tatoeba-test.mnw-eng: 0.110
  Tatoeba-test.multi-eng: 0.407
  Tatoeba-test.vie-eng: 0.529