Skip to content

Commit 29d2c2e

Browse files
committed
Update related to issue #11
1 parent 1d75072 commit 29d2c2e

21 files changed

+14786
-13847
lines changed

‎.gitignore

+3-1
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
11
dist
2-
data
2+
data/tmp
3+
data/udhr
4+
data/tatoeba.csv
35
node_modules

‎data/bench/cld.json

+84
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
{
2+
"size": {
3+
"12": {
4+
"success_rate": 36.375,
5+
"error_rate": 3.25,
6+
"unindentified_rate": 60.375,
7+
"execution_time": 0.0706
8+
},
9+
"24": {
10+
"success_rate": 77.7188,
11+
"error_rate": 3.0313,
12+
"unindentified_rate": 19.25,
13+
"execution_time": 0.0548
14+
},
15+
"36": {
16+
"success_rate": 92.8125,
17+
"error_rate": 1.75,
18+
"unindentified_rate": 5.4375,
19+
"execution_time": 0.0545
20+
},
21+
"48": {
22+
"success_rate": 96.75,
23+
"error_rate": 1.0938,
24+
"unindentified_rate": 2.1563,
25+
"execution_time": 0.0582
26+
},
27+
"64": {
28+
"success_rate": 98.2813,
29+
"error_rate": 0.5,
30+
"unindentified_rate": 1.2188,
31+
"execution_time": 0.0566
32+
},
33+
"128": {
34+
"success_rate": 99.5625,
35+
"error_rate": 0.0938,
36+
"unindentified_rate": 0.3438,
37+
"execution_time": 0.0595
38+
},
39+
"256": {
40+
"success_rate": 99.9375,
41+
"error_rate": 0.0313,
42+
"unindentified_rate": 0.0313,
43+
"execution_time": 0.0662
44+
},
45+
"512": {
46+
"success_rate": 99.9688,
47+
"error_rate": 0,
48+
"unindentified_rate": 0.0313,
49+
"execution_time": 0.0799
50+
},
51+
"1024": {
52+
"success_rate": 100,
53+
"error_rate": 0,
54+
"unindentified_rate": 0,
55+
"execution_time": 0.1108
56+
}
57+
},
58+
"stats": {
59+
"min": 78.39,
60+
"max": 100,
61+
"success_rate": 92.3097,
62+
"error_rate": 1.6328,
63+
"unindentified_rate": 6.0574,
64+
"execution_time": 0.0543
65+
},
66+
"languages": {
67+
"jpn": 100,
68+
"kor": 100,
69+
"hin": 99.43,
70+
"eng": 99.18,
71+
"deu": 97.58,
72+
"fin": 96.3,
73+
"cmn": 94.52,
74+
"fra": 94.05,
75+
"tur": 93.2,
76+
"por": 91.89,
77+
"rus": 89.69,
78+
"nld": 89.58,
79+
"spa": 87.79,
80+
"ita": 85.9,
81+
"heb": 84.05,
82+
"ara": 78.39
83+
}
84+
}

‎data/bench/franc-all.json

+84
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
{
2+
"size": {
3+
"12": {
4+
"success_rate": 18.5313,
5+
"error_rate": 35,
6+
"unindentified_rate": 46.4688,
7+
"execution_time": 0.104
8+
},
9+
"24": {
10+
"success_rate": 48.4375,
11+
"error_rate": 51.5625,
12+
"unindentified_rate": 0,
13+
"execution_time": 0.2488
14+
},
15+
"36": {
16+
"success_rate": 60.625,
17+
"error_rate": 39.375,
18+
"unindentified_rate": 0,
19+
"execution_time": 0.3291
20+
},
21+
"48": {
22+
"success_rate": 69.5938,
23+
"error_rate": 30.4063,
24+
"unindentified_rate": 0,
25+
"execution_time": 0.4012
26+
},
27+
"64": {
28+
"success_rate": 73.5625,
29+
"error_rate": 26.4375,
30+
"unindentified_rate": 0,
31+
"execution_time": 0.473
32+
},
33+
"128": {
34+
"success_rate": 86.0938,
35+
"error_rate": 13.9063,
36+
"unindentified_rate": 0,
37+
"execution_time": 0.7312
38+
},
39+
"256": {
40+
"success_rate": 93.6875,
41+
"error_rate": 6.3125,
42+
"unindentified_rate": 0,
43+
"execution_time": 1.2803
44+
},
45+
"512": {
46+
"success_rate": 96.3125,
47+
"error_rate": 3.6875,
48+
"unindentified_rate": 0,
49+
"execution_time": 2.2039
50+
},
51+
"1024": {
52+
"success_rate": 98.381,
53+
"error_rate": 1.619,
54+
"unindentified_rate": 0,
55+
"execution_time": 3.7052
56+
}
57+
},
58+
"stats": {
59+
"min": 29.47,
60+
"max": 99.93,
61+
"success_rate": 66.4673,
62+
"error_rate": 33.5327,
63+
"unindentified_rate": 0,
64+
"execution_time": 0.3554
65+
},
66+
"languages": {
67+
"jpn": 99.93,
68+
"kor": 99.8261,
69+
"cmn": 99.35,
70+
"heb": 98.18,
71+
"ara": 91.73,
72+
"deu": 80.77,
73+
"fin": 70.8,
74+
"fra": 67.27,
75+
"hin": 60.4,
76+
"nld": 59.65,
77+
"rus": 51.94,
78+
"eng": 49.88,
79+
"por": 49.39,
80+
"ita": 42.55,
81+
"tur": 32.27,
82+
"spa": 29.47
83+
}
84+
}

‎data/bench/franc-min.json

+84
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
{
2+
"size": {
3+
"12": {
4+
"success_rate": 21.4375,
5+
"error_rate": 29.375,
6+
"unindentified_rate": 49.1875,
7+
"execution_time": 0.0187
8+
},
9+
"24": {
10+
"success_rate": 53.25,
11+
"error_rate": 40.5,
12+
"unindentified_rate": 6.25,
13+
"execution_time": 0.0368
14+
},
15+
"36": {
16+
"success_rate": 66.9375,
17+
"error_rate": 26.8125,
18+
"unindentified_rate": 6.25,
19+
"execution_time": 0.0513
20+
},
21+
"48": {
22+
"success_rate": 73.4063,
23+
"error_rate": 20.3438,
24+
"unindentified_rate": 6.25,
25+
"execution_time": 0.0628
26+
},
27+
"64": {
28+
"success_rate": 75.9063,
29+
"error_rate": 17.875,
30+
"unindentified_rate": 6.2188,
31+
"execution_time": 0.0753
32+
},
33+
"128": {
34+
"success_rate": 82.4688,
35+
"error_rate": 11.3438,
36+
"unindentified_rate": 6.1875,
37+
"execution_time": 0.1207
38+
},
39+
"256": {
40+
"success_rate": 85.1563,
41+
"error_rate": 8.6875,
42+
"unindentified_rate": 6.1563,
43+
"execution_time": 0.2316
44+
},
45+
"512": {
46+
"success_rate": 86.5625,
47+
"error_rate": 7.4063,
48+
"unindentified_rate": 6.0313,
49+
"execution_time": 0.4174
50+
},
51+
"1024": {
52+
"success_rate": 86.9841,
53+
"error_rate": 7.0159,
54+
"unindentified_rate": 6,
55+
"execution_time": 0.7425
56+
}
57+
},
58+
"stats": {
59+
"min": 0.01,
60+
"max": 99.93,
61+
"success_rate": 70.1739,
62+
"error_rate": 23.3584,
63+
"unindentified_rate": 6.4677,
64+
"execution_time": 0.0657
65+
},
66+
"languages": {
67+
"jpn": 99.93,
68+
"kor": 99.8261,
69+
"cmn": 99.35,
70+
"deu": 94.18,
71+
"ara": 91.89,
72+
"fra": 87.32,
73+
"nld": 87.21,
74+
"eng": 81.38,
75+
"por": 76.8,
76+
"ita": 74.31,
77+
"hin": 68.22,
78+
"spa": 67.38,
79+
"tur": 58.11,
80+
"rus": 54.59,
81+
"fin": 0.01,
82+
"heb": 0.01
83+
}
84+
}

‎data/bench/franc.json

+84
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
{
2+
"size": {
3+
"12": {
4+
"success_rate": 20.6875,
5+
"error_rate": 32.8438,
6+
"unindentified_rate": 46.4688,
7+
"execution_time": 0.0431
8+
},
9+
"24": {
10+
"success_rate": 54.6875,
11+
"error_rate": 45.3125,
12+
"unindentified_rate": 0,
13+
"execution_time": 0.0943
14+
},
15+
"36": {
16+
"success_rate": 69.125,
17+
"error_rate": 30.875,
18+
"unindentified_rate": 0,
19+
"execution_time": 0.1228
20+
},
21+
"48": {
22+
"success_rate": 77.0938,
23+
"error_rate": 22.9063,
24+
"unindentified_rate": 0,
25+
"execution_time": 0.1526
26+
},
27+
"64": {
28+
"success_rate": 80.9375,
29+
"error_rate": 19.0625,
30+
"unindentified_rate": 0,
31+
"execution_time": 0.1831
32+
},
33+
"128": {
34+
"success_rate": 91.1875,
35+
"error_rate": 8.8125,
36+
"unindentified_rate": 0,
37+
"execution_time": 0.2902
38+
},
39+
"256": {
40+
"success_rate": 96.7188,
41+
"error_rate": 3.2813,
42+
"unindentified_rate": 0,
43+
"execution_time": 0.5402
44+
},
45+
"512": {
46+
"success_rate": 98.9375,
47+
"error_rate": 1.0625,
48+
"unindentified_rate": 0,
49+
"execution_time": 0.971
50+
},
51+
"1024": {
52+
"success_rate": 99.6825,
53+
"error_rate": 0.3175,
54+
"unindentified_rate": 0,
55+
"execution_time": 1.6949
56+
}
57+
},
58+
"stats": {
59+
"min": 48.96,
60+
"max": 99.93,
61+
"success_rate": 74.0726,
62+
"error_rate": 25.9274,
63+
"unindentified_rate": 0,
64+
"execution_time": 0.1482
65+
},
66+
"languages": {
67+
"jpn": 99.93,
68+
"kor": 99.8261,
69+
"cmn": 99.35,
70+
"heb": 98.23,
71+
"ara": 91.85,
72+
"deu": 83.87,
73+
"fra": 79.36,
74+
"fin": 78.53,
75+
"hin": 68.22,
76+
"ita": 64.19,
77+
"por": 62.29,
78+
"nld": 62.01,
79+
"eng": 60.38,
80+
"rus": 52.3,
81+
"spa": 51.25,
82+
"tur": 48.96
83+
}
84+
}

0 commit comments

Comments
 (0)