Add model files
#1
by
starride-teklia
- opened
- README.md +21 -3
- language_model.arpa.gz +3 -0
- lexicon.txt +100 -0
- model +0 -0
- syms.txt +100 -0
- tokens.txt +100 -0
- weights.ckpt +3 -0
README.md
CHANGED
@@ -1,3 +1,21 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# PyLaia Rimes
|
2 |
+
|
3 |
+
## Datasets
|
4 |
+
|
5 |
+
This model was trained on text lines from the [Rimes 2011 dataset](https://teklia.com/research/rimes-database/).
|
6 |
+
|
7 |
+
| split | N lines |
|
8 |
+
|--------|--------:|
|
9 |
+
| train | 10,188 |
|
10 |
+
| val | 1,138 |
|
11 |
+
| test | 778 |
|
12 |
+
|
13 |
+
## Results
|
14 |
+
|
15 |
+
* Fixed line height: 128 pixels
|
16 |
+
* Language model: 6-gram character-level model, trained with KenLM on the training set
|
17 |
+
|
18 |
+
| Model | val CER | test CER | val WER | test WER |
|
19 |
+
|:--------------------------------|--------:|---------:|--------:|---------:|
|
20 |
+
| Model without LM | 4.55 | 4.53 | 14.39 | 15.06 |
|
21 |
+
| Model with LM (`weight = 1.5`) | 3.68 | 3.47 | 10.01 | 10.20 |
|
language_model.arpa.gz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:119d9433498a3c17f934be86db2dbc7794cc5ff3861c8d0a4fa8e197f10658d5
|
3 |
+
size 5140408
|
lexicon.txt
ADDED
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<ctc> <ctc>
|
2 |
+
! !
|
3 |
+
" "
|
4 |
+
% %
|
5 |
+
' '
|
6 |
+
( (
|
7 |
+
) )
|
8 |
+
, ,
|
9 |
+
- -
|
10 |
+
. .
|
11 |
+
/ /
|
12 |
+
0 0
|
13 |
+
1 1
|
14 |
+
2 2
|
15 |
+
3 3
|
16 |
+
4 4
|
17 |
+
5 5
|
18 |
+
6 6
|
19 |
+
7 7
|
20 |
+
8 8
|
21 |
+
9 9
|
22 |
+
: :
|
23 |
+
; ;
|
24 |
+
= =
|
25 |
+
? ?
|
26 |
+
A A
|
27 |
+
B B
|
28 |
+
C C
|
29 |
+
D D
|
30 |
+
E E
|
31 |
+
F F
|
32 |
+
G G
|
33 |
+
H H
|
34 |
+
I I
|
35 |
+
J J
|
36 |
+
K K
|
37 |
+
L L
|
38 |
+
M M
|
39 |
+
N N
|
40 |
+
O O
|
41 |
+
P P
|
42 |
+
Q Q
|
43 |
+
R R
|
44 |
+
S S
|
45 |
+
T T
|
46 |
+
U U
|
47 |
+
V V
|
48 |
+
W W
|
49 |
+
X X
|
50 |
+
Y Y
|
51 |
+
Z Z
|
52 |
+
_ _
|
53 |
+
a a
|
54 |
+
b b
|
55 |
+
c c
|
56 |
+
d d
|
57 |
+
e e
|
58 |
+
f f
|
59 |
+
g g
|
60 |
+
h h
|
61 |
+
i i
|
62 |
+
j j
|
63 |
+
k k
|
64 |
+
l l
|
65 |
+
m m
|
66 |
+
n n
|
67 |
+
o o
|
68 |
+
p p
|
69 |
+
q q
|
70 |
+
r r
|
71 |
+
s s
|
72 |
+
t t
|
73 |
+
u u
|
74 |
+
v v
|
75 |
+
w w
|
76 |
+
x x
|
77 |
+
y y
|
78 |
+
z z
|
79 |
+
{ {
|
80 |
+
} }
|
81 |
+
¤ ¤
|
82 |
+
° °
|
83 |
+
² ²
|
84 |
+
À À
|
85 |
+
É É
|
86 |
+
à à
|
87 |
+
â â
|
88 |
+
ç ç
|
89 |
+
è è
|
90 |
+
é é
|
91 |
+
ê ê
|
92 |
+
ë ë
|
93 |
+
î î
|
94 |
+
ô ô
|
95 |
+
ù ù
|
96 |
+
û û
|
97 |
+
œ œ
|
98 |
+
€ €
|
99 |
+
<unk> <unk>
|
100 |
+
<space> <space>
|
model
ADDED
Binary file (1.52 kB). View file
|
|
syms.txt
ADDED
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<ctc> 0
|
2 |
+
! 1
|
3 |
+
" 2
|
4 |
+
% 3
|
5 |
+
' 4
|
6 |
+
( 5
|
7 |
+
) 6
|
8 |
+
, 7
|
9 |
+
- 8
|
10 |
+
. 9
|
11 |
+
/ 10
|
12 |
+
0 11
|
13 |
+
1 12
|
14 |
+
2 13
|
15 |
+
3 14
|
16 |
+
4 15
|
17 |
+
5 16
|
18 |
+
6 17
|
19 |
+
7 18
|
20 |
+
8 19
|
21 |
+
9 20
|
22 |
+
: 21
|
23 |
+
; 22
|
24 |
+
= 23
|
25 |
+
? 24
|
26 |
+
A 25
|
27 |
+
B 26
|
28 |
+
C 27
|
29 |
+
D 28
|
30 |
+
E 29
|
31 |
+
F 30
|
32 |
+
G 31
|
33 |
+
H 32
|
34 |
+
I 33
|
35 |
+
J 34
|
36 |
+
K 35
|
37 |
+
L 36
|
38 |
+
M 37
|
39 |
+
N 38
|
40 |
+
O 39
|
41 |
+
P 40
|
42 |
+
Q 41
|
43 |
+
R 42
|
44 |
+
S 43
|
45 |
+
T 44
|
46 |
+
U 45
|
47 |
+
V 46
|
48 |
+
W 47
|
49 |
+
X 48
|
50 |
+
Y 49
|
51 |
+
Z 50
|
52 |
+
_ 51
|
53 |
+
a 52
|
54 |
+
b 53
|
55 |
+
c 54
|
56 |
+
d 55
|
57 |
+
e 56
|
58 |
+
f 57
|
59 |
+
g 58
|
60 |
+
h 59
|
61 |
+
i 60
|
62 |
+
j 61
|
63 |
+
k 62
|
64 |
+
l 63
|
65 |
+
m 64
|
66 |
+
n 65
|
67 |
+
o 66
|
68 |
+
p 67
|
69 |
+
q 68
|
70 |
+
r 69
|
71 |
+
s 70
|
72 |
+
t 71
|
73 |
+
u 72
|
74 |
+
v 73
|
75 |
+
w 74
|
76 |
+
x 75
|
77 |
+
y 76
|
78 |
+
z 77
|
79 |
+
{ 78
|
80 |
+
} 79
|
81 |
+
¤ 80
|
82 |
+
° 81
|
83 |
+
² 82
|
84 |
+
À 83
|
85 |
+
É 84
|
86 |
+
à 85
|
87 |
+
â 86
|
88 |
+
ç 87
|
89 |
+
è 88
|
90 |
+
é 89
|
91 |
+
ê 90
|
92 |
+
ë 91
|
93 |
+
î 92
|
94 |
+
ô 93
|
95 |
+
ù 94
|
96 |
+
û 95
|
97 |
+
œ 96
|
98 |
+
€ 97
|
99 |
+
<unk> 98
|
100 |
+
<space> 99
|
tokens.txt
ADDED
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<ctc>
|
2 |
+
!
|
3 |
+
"
|
4 |
+
%
|
5 |
+
'
|
6 |
+
(
|
7 |
+
)
|
8 |
+
,
|
9 |
+
-
|
10 |
+
.
|
11 |
+
/
|
12 |
+
0
|
13 |
+
1
|
14 |
+
2
|
15 |
+
3
|
16 |
+
4
|
17 |
+
5
|
18 |
+
6
|
19 |
+
7
|
20 |
+
8
|
21 |
+
9
|
22 |
+
:
|
23 |
+
;
|
24 |
+
=
|
25 |
+
?
|
26 |
+
A
|
27 |
+
B
|
28 |
+
C
|
29 |
+
D
|
30 |
+
E
|
31 |
+
F
|
32 |
+
G
|
33 |
+
H
|
34 |
+
I
|
35 |
+
J
|
36 |
+
K
|
37 |
+
L
|
38 |
+
M
|
39 |
+
N
|
40 |
+
O
|
41 |
+
P
|
42 |
+
Q
|
43 |
+
R
|
44 |
+
S
|
45 |
+
T
|
46 |
+
U
|
47 |
+
V
|
48 |
+
W
|
49 |
+
X
|
50 |
+
Y
|
51 |
+
Z
|
52 |
+
_
|
53 |
+
a
|
54 |
+
b
|
55 |
+
c
|
56 |
+
d
|
57 |
+
e
|
58 |
+
f
|
59 |
+
g
|
60 |
+
h
|
61 |
+
i
|
62 |
+
j
|
63 |
+
k
|
64 |
+
l
|
65 |
+
m
|
66 |
+
n
|
67 |
+
o
|
68 |
+
p
|
69 |
+
q
|
70 |
+
r
|
71 |
+
s
|
72 |
+
t
|
73 |
+
u
|
74 |
+
v
|
75 |
+
w
|
76 |
+
x
|
77 |
+
y
|
78 |
+
z
|
79 |
+
{
|
80 |
+
}
|
81 |
+
¤
|
82 |
+
°
|
83 |
+
²
|
84 |
+
À
|
85 |
+
É
|
86 |
+
à
|
87 |
+
â
|
88 |
+
ç
|
89 |
+
è
|
90 |
+
é
|
91 |
+
ê
|
92 |
+
ë
|
93 |
+
î
|
94 |
+
ô
|
95 |
+
ù
|
96 |
+
û
|
97 |
+
œ
|
98 |
+
€
|
99 |
+
<unk>
|
100 |
+
<space>
|
weights.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b24aa78625c3c5cfbd07926aee3d5890dec2d7aab931a1c55bdbe6770236a8aa
|
3 |
+
size 42750044
|