Commit 7eb16d1f authored by Ivan Bogatyy's avatar Ivan Bogatyy Committed by calberti
Browse files

Update docs & tutorial (#1178)

* Release DRAGNN

* Update CoNLL evaluation table & evaluator.py

* Update documentation & tutorial for DRAGNN
parent 7d30a017
......@@ -38,16 +38,19 @@ def parse_tree_graph(sentence):
warnings.simplefilter("ignore")
svg = graph.draw(format="svg", prog="dot")
svg = unicode(svg, "utf-8")
# For both inline and "new window" displays, we show the tokens with the
# graph. (The sentence order of nodes is sometimes difficult to read.)
image_and_text = "<p><em>Text:</em> {}</p>{}".format(" ".join(
image_and_text = u"<p><em>Text:</em> {}</p>{}".format(" ".join(
token.word for token in sentence.token), svg)
# We generate a base64 URI. This is not too big, but older browsers may not
# handle it well.
new_window_html = ("<style type='text/css'>svg { max-width: 100%; }</style>" +
image_and_text)
as_uri = "data:text/html;base64,{}".format(base64.b64encode(new_window_html))
new_window_html = (u"<style type='text/css'>svg { max-width: 100%; }</style>"
+ image_and_text).encode("utf-8")
as_uri = "data:text/html;charset=utf-8;base64,{}".format(
base64.b64encode(new_window_html))
return "{}<p><a target='_blank' href='{}'>Open in new window</a></p>".format(
return u"{}<p><a target='_blank' href='{}'>Open in new window</a></p>".format(
image_and_text, as_uri)
......@@ -17,7 +17,7 @@ class RenderParseTreeGraphvizTest(googletest.TestCase):
document.token.add(start=1, end=1, word='there')
contents = render_parse_tree_graphviz.parse_tree_graph(document)
self.assertIn('<polygon', contents)
self.assertIn('text/html;base64', contents)
self.assertIn('text/html;charset=utf-8;base64', contents)
self.assertIn('something', contents)
self.assertIn('hi', contents)
self.assertIn('there', contents)
......
291
e 194689
a 174901
o 121583
n 106574
s 101928
r 96059
i 95120
l 83450
d 77144
t 65680
c 63070
u 57078
m 37618
p 35913
9 23979
, 18307
b 18176
g 16618
. 14475
y 13387
v 13197
ó 11400
f 11251
h 10796
q 9967
í 7152
E 5983
á 5719
z 5627
j 5260
C 4656
A 4280
S 4212
é 3968
L 3736
M 3421
P 3112
ñ 2851
" 2328
x 2311
B 2203
D 2094
T 2036
( 2025
) 2022
ú 1920
R 1897
I 1872
k 1733
G 1624
F 1622
N 1592
- 1370
H 1306
J 1176
V 1152
U 1004
O 977
w 698
% 618
: 553
W 484
K 475
' 334
X 325
Y 315
² 296
; 236
/ 224
Z 210
« 154
» 153
Q 148
Á 130
? 111
¿ 107
$ 101
ü 95
É 62
! 57
º 50
° 41
ö 35
& 31
è 29
à 22
€ 22
+ 21
¡ 20
ª 20
= 19
[ 19
ç 19
] 18
Ó 17
ō 16
ä 14
â 13
# 11
ã 10
α 10
ο 10
ð 9
ø 9
Í 8
λ 8
* 7
× 7
å 7
ô 7
ć 7
ρ 7
ا 7
 7
` 6
ū 6
ς 6
• 6
Ú 5
æ 5
ι 5
φ 5
и 5
Ñ 4
Ö 4
ë 4
ò 4
č 4
ε 4
κ 4
μ 4
τ 4
р 4
ت 4
ل 4
م 4
� 4
| 3
¢ 3
£ 3
· 3
ï 3
õ 3
ù 3
ā 3
ğ 3
ī 3
ı 3
ő 3
œ 3
ş 3
š 3
Δ 3
η 3
π 3
υ 3
е 3
н 3
о 3
т 3
ب 3
ा 3
ম 3
³ 2
Î 2
Ü 2
î 2
ý 2
Đ 2
Ł 2
ř 2
Š 2
ǚ 2
ɔ 2
ə 2
Γ 2
Ζ 2
Φ 2
ί 2
ν 2
ό 2
А 2
К 2
а 2
в 2
г 2
й 2
ר 2
ح 2
س 2
ن 2
ग 2
ৌ 2
♯ 2
一 2
下 2
关 2
天 2
第 2
_ 1
Å 1
È 1
ß 1
ê 1
ì 1
û 1
þ 1
đ 1
ē 1
ġ 1
İ 1
ł 1
Ś 1
ů 1
ŵ 1
ž 1
ɛ 1
ʂ 1
ː 1
Β 1
Κ 1
Ν 1
έ 1
ή 1
β 1
γ 1
δ 1
σ 1
χ 1
З 1
И 1
О 1
П 1
С 1
Ф 1
д 1
к 1
п 1
с 1
ч 1
ё 1
ְ 1
ֵ 1
ָ 1
ה 1
ט 1
ס 1
ע 1
פ 1
ء 1
ة 1
ج 1
د 1
ر 1
ط 1
غ 1
ف 1
و 1
ي 1
ं 1
औ 1
द 1
ब 1
भ 1
र 1
व 1
ि 1
ক 1
ভ 1
স 1
ি 1
ী 1
ু 1
ḥ 1
Ἀ 1
ᾶ 1
ῦ 1
† 1
№ 1
が 1
ぎ 1
ぐ 1
げ 1
ご 1
上 1
円 1
海 1
申 1
花 1
銭 1
雄 1
32
case 56548
det 51438
punct 40104
nmod 33120
obl 20916
amod 19460
conj 14420
root 13477
nsubj 13214
obj 11448
cc 11100
mark 9681
advmod 9517
appos 7524
iobj 6239
flat 6110
nummod 6054
cop 5274
acl 4722
acl:relcl 4478
advcl 3547
aux 3483
fixed 2365
aux:pass 1578
parataxis 1370
ccomp 1320
xcomp 1188
dep 1021
nsubj:pass 1006
csubj 567
compound 357
csubj:pass 5
component {
name: "char_lstm"
transition_system {
registered_name: "char-shift-only"
parameters {
key: "left_to_right"
value: "true"
}
}
fixed_feature {
name: "chars"
fml: "char-input.text-char"
embedding_dim: 16
}
network_unit {
registered_name: "wrapped_units.LayerNormBasicLSTMNetwork"
parameters {
key: "hidden_layer_sizes"
value: "256"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
component {
name: "lookahead"
transition_system {
registered_name: "shift-only"
parameters {
key: "left_to_right"
value: "false"
}
}
linked_feature {
name: "char_lstm"
fml: "input.last-char-focus"
embedding_dim: 64
source_component: "char_lstm"
source_translator: "identity"
source_layer: "state_h_0"
}
network_unit {
registered_name: "wrapped_units.LayerNormBasicLSTMNetwork"
parameters {
key: "hidden_layer_sizes"
value: "256"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
component {
name: "tagger"
transition_system {
registered_name: "tagger"
}
linked_feature {
name: "lookahead"
fml: "input.focus"
embedding_dim: 64
source_component: "lookahead"
source_translator: "reverse-token"
source_layer: "state_h_0"
}
network_unit {
registered_name: "wrapped_units.LayerNormBasicLSTMNetwork"
parameters {
key: "hidden_layer_sizes"
value: "256"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
component {
name: "parser"
transition_system {
registered_name: "arc-standard"
}
fixed_feature {
name: "labels"
fml: "stack.child(1).label stack.child(1).sibling(-1).label stack.child(-1).label stack.child(-1).sibling(1).label stack(1).child(1).label stack(1).child(1).sibling(-1).label stack(1).child(-1).label stack(1).child(-1).sibling(1).label stack.child(2).label stack.child(-2).label stack(1).child(2).label stack(1).child(-2).label"
embedding_dim: 16
}
linked_feature {
name: "lookahead"
fml: "input.focus"
embedding_dim: 64
source_component: "lookahead"
source_translator: "reverse-token"
source_layer: "state_h_0"
}
linked_feature {
name: "tagger"
fml: "input.focus stack.focus stack(1).focus"
embedding_dim: 64
source_component: "tagger"
source_translator: "identity"
source_layer: "state_h_0"
}
linked_feature {
name: "rnn-stack"
fml: "stack.focus stack(1).focus"
embedding_dim: 64
source_component: "parser"
source_translator: "shift-reduce-step"
source_layer: "layer_0"
}
network_unit {
registered_name: "FeedForwardNetwork"
parameters {
key: "hidden_layer_sizes"
value: "256"
}
parameters {
key: "layer_norm_hidden"
value: "true"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
291
e 194689
a 174901
o 121583
n 106574
s 101928
r 96059
i 95120
l 83450
d 77144
t 65680
c 63070
u 57078
m 37618
p 35913
9 23979
, 18307
b 18176
g 16618
. 14475
y 13387
v 13197
ó 11400
f 11251
h 10796
q 9967
í 7152
E 5983
á 5719
z 5627
j 5260
C 4656
A 4280
S 4212
é 3968
L 3736
M 3421
P 3112
ñ 2851
" 2328
x 2311
B 2203
D 2094
T 2036
( 2025
) 2022
ú 1920
R 1897
I 1872
k 1733
G 1624
F 1622
N 1592
- 1370
H 1306
J 1176
V 1152
U 1004
O 977
w 698
% 618
: 553
W 484
K 475
' 334
X 325
Y 315
² 296
; 236
/ 224
Z 210
« 154
» 153
Q 148
Á 130
? 111
¿ 107
$ 101
ü 95
É 62
! 57
º 50
° 41
ö 35
& 31
è 29
à 22
€ 22
+ 21
¡ 20
ª 20
= 19
[ 19
ç 19
] 18
Ó 17
ō 16
ä 14
â 13
# 11
ã 10
α 10
ο 10
ð 9
ø 9
Í 8
λ 8
* 7
× 7
å 7
ô 7
ć 7
ρ 7
ا 7
 7
` 6
ū 6
ς 6
• 6
Ú 5
æ 5
ι 5
φ 5
и 5
Ñ 4
Ö 4
ë 4
ò 4
č 4
ε 4
κ 4
μ 4
τ 4
р 4
ت 4
ل 4
م 4
� 4
| 3
¢ 3
£ 3
· 3
ï 3
õ 3
ù 3
ā 3
ğ 3
ī 3
ı 3
ő 3
œ 3
ş 3
š 3
Δ 3
η 3
π 3
υ 3
е 3
н 3
о 3
т 3
ب 3
ा 3
ম 3
³ 2
Î 2
Ü 2
î 2
ý 2
Đ 2
Ł 2
ř 2
Š 2
ǚ 2
ɔ 2
ə 2
Γ 2
Ζ 2
Φ 2
ί 2
ν 2
ό 2
А 2
К 2
а 2
в 2
г 2
й 2
ר 2
ح 2
س 2
ن 2
ग 2
ৌ 2
♯ 2
一 2
下 2
关 2
天 2
第 2
_ 1
Å 1
È 1
ß 1
ê 1
ì 1
û 1
þ 1
đ 1
ē 1
ġ 1
İ 1
ł 1
Ś 1
ů 1
ŵ 1
ž 1
ɛ 1
ʂ 1
ː 1
Β 1
Κ 1
Ν 1
έ 1
ή 1
β 1
γ 1
δ 1
σ 1
χ 1
З 1
И 1
О 1
П 1
С 1
Ф 1
д 1
к 1
п 1
с 1
ч 1
ё 1
ְ 1
ֵ 1
ָ 1
ה 1
ט 1
ס 1
ע 1
פ 1
ء 1
ة 1
ج 1
د 1
ر 1
ط 1
غ 1
ف 1
و 1
ي 1
ं 1
औ 1
द 1
ब 1
भ 1
र 1
व 1
ि 1
ক 1
ভ 1
স 1
ি 1
ী 1
ু 1
ḥ 1
Ἀ 1
ᾶ 1
ῦ 1
† 1
№ 1
が 1
ぎ 1
ぐ 1
げ 1
ご 1
上 1
円 1
海 1
申 1
花 1
銭 1
雄 1
2621
de 38554
en 31682
es 26577
la 22548
er 20776
os 20645
el 19830
ra 18923
ar 17417
on 17136
as 16882
nt 16819
an 16362
re 16068
co 15947
ci 15924
ue 15570
te 14952
ta 14776
99 14646
or 14196
do 13978
ad 13916
st 12880
al 12829
na 11676
un 10883
ro 10836
ca 10828
in 10478
to 10265
ri 10181
lo 10090
da 10041
qu 9945
se 9816
ic 9803
ti 9009
po 8455
tr 8443
io 8291
le 8283
ie 8282
ac 8076
ia 7871
pa 7687
id 7464
no 7337
me 7302
nd 7100
si 7082
ma 6968
di 6722
ió 6444
ne 6388
ec 6291
is 6261
om 6238
li 6196
ón 6090
pr 5967
nc 5714
pe 5678
am 5592
ni 5574
mi 5282
mo 5260
su 5065
so 5062
ce 4673
ab 4648
rt 4586
it 4581
ha 4571
cu 4416
sa 4412
em 4396
at 4308
ll 4042
il 4038
ol 3962
ba 3948
vi 3925
ur 3840
ve 3727
im 3591
ed 3506
mp 3488
ía 3452
tu 3405
eg 3336
oc 3291
bi 3280
ns 3259
ua 3254
br 3188
ga 3176
us 3098
ir 3037
ct 2947
va 2856
gu 2839
rr 2804
mb 2769
fi 2751
et 2736
za 2685
ui 2655
sp 2637
ch 2634
ob 2633
iv 2595
ot 2545
pu 2534
bl 2511
od 2508
ig 2470
ul 2417
fu 2379
gr 2376
mu 2347
rm 2335
ea 2308
go 2265
pi 2156
sc 2131
uc 2052
vo 1914
má 1887
lu 1878
ho 1868
La 1835
añ 1822
El 1815
ev 1795
rc 1780
ás 1761
ng 1751
ip 1748
ap 1734
rd 1717
rí 1698
ge 1683
ño 1682
pl 1662
du 1641
ag 1628
ud 1603
Es 1600
iz 1597
op 1580
gi 1554
fe 1550
ru 1528
ex 1520
hi 1519
cr 1510
ep 1502
rs 1492
lt 1462
ut 1457
rg 1452
be 1440
ib 1418
jo 1414
aj 1407
En 1374
rn 1346
fo 1339
ay 1305
Co 1290
au 1282
nu 1277
he 1266
Ma 1265
ub 1259
cl 1256
um 1229
bo 1223
ja 1185
ej 1180
rá 1166
dr 1165
án 1165
fa 1164
Ca 1159
je 1156
ez 1140
av 1136
ov 1132
ju 1110
eb 1101
fr 1042
if 1029
up 1023
eo 1017
cc 1006
bu 1004
én 981
Se 977
og 967
az 917
ña 916
uy 911
lm 881
tá 859
.9 854
9. 853
és 852
sm 841
Sa 834
nf 830
ié 824
ug 823
zo 812
ef 788
lí 776
De 774
of 772
Pa 760
xi 757
Lo 756
Al 751
ya 748
nz 734
eñ 732
nv 726
ún 726
yo 713
Un 685
ís 644
tó 639
Re 613
rv 608
ró 603
ye 601
lg 596
Su 584
Ba 583
gl 583
eq 578
oy 558
ai 557
tí 556
ei 544
iu 539
ín 537
dí 536
af 530
Po 525
pt 522
ér 507
hu 499
lv 489
ou 484
In 483
Ar 482
sd 476
xp 476
Pr 473
Pe 464
Mi 455
ey 452
ld 452
Me 445
Mo 445
Ch 444
ae 444
Si 441
sí 437
uv 437
Ro 426
An 425
eu 424
,9 421
9, 421
rp 410
bí 408
xt 408
aí 406
nq 406
ní 406
cí 403
ít 400
gú 399
Na 390
ué 387
No 385
ee 380
ló 379
nó 378
sl 376
rq 371
Ha 369
íc 369
rb 362
Ju 356
km 354
ij 352
só 351
zó 351
ól 351
có 350
lc 349
Jo 346
gn 345
Ta 341
rz 340
Tr 338
Vi 334
oo 332
Mu 331
rl 329
uj 329
To 326
th 323
Di 322
Be 318
So 318
Le 313
ío 312
fl 311
Fr 309
Bo 304
Gr 301
Gu 296
ah 296
ss 293
oe 292
oa 291
át 290
Ce 283
Li 282
Te 280
Ga 279
lb 278
óm 277
ck 276
Fu 274
As 270
aq 270
ál 270
té 269
ár 265
mó 264
tt 264
Cu 263
Br 261
ls 259
nn 256
sh 256
úl 256
Fe 255
lé 255
II 252
gó 248
mé 248
oj 248
Ho 245
él 244
éc 243
dó 242
sf 242
Lu 240
Va 240
ác 240
ví 239
Ja 237
ki 237
lá 223
Ad 222
Ci 222
He 222
rf 220
úb 218
pú 217
Ra 216
Ge 215
ke 215
Am 209
bs 209
yu 208
Or 207
Au 206
Go 206
oz 203
oi 202
uí 202
Da 200
ry 199
St 197
cá 196
Ve 195
Do 193
nú 193
Cr 192
ór 192
Bu 191
Cl 191
dé 191
ow 190
ús 189
uz 188
Fi 186
mí 184
mú 184
ré 184
ét 184
Du 183
Ri 182
vu 182
Th 181
eó 181
fí 179
-9 177
lq 177
nm 177
Pi 176
pó 175
gí 174
ak 173
sq 173
xc 173
íf 173
9- 172
nj 170
uo 168
íd 167
Ni 165
Ti 164
Bi 162
Hi 162
ka 162
iq 161
tl 161
Eu 159
sé 158
úm 157
Ac 156
pc 156
Nu 155
óg 155
Ne 154
éx 154
tb 153
wa 153
jó 151
ám 151
cn 150
cé 150
Fa 148
Ru 148
oh 147
ts 145
rk 144
Pu 140
lp 139
áf 138
iñ 137
Pl 136
ps 136
lf 135
uf 135
ná 134
ím 134
Hu 132
iá 131
-- 130
.. 128
dm 128
Je 127
Qu 127
mm 126
Wi 125
ik 125
vé 124
Fo 123
oq 121
gé 118
ox 118
bt 117
Gi 116
gh 115
hí 115
mn 115
Ka 114
At 112
ao 112
we 112
Sh 111
bj 111
zu 111
ós 110
Wa 109
Is 108
Bl 107
áp 107
Ag 106
Tu 106
nr 106
ty 106
óp 106
Ed 105
eh 105
ép 105
óv 104
Yo 103
út 103
jé 102
né 101
Mé 100
nk 100
ny 100
sk 100
ñí 100
Ex 98
Ap 97
VI 97
ph 97
ly 96
hn 94
zc 94
xa 92
Of 91
Ki 90
Sc 88
ko 88
yó 88
lr 87
Fl 86
ok 86
Sp 85
ji 85
wi 85
óx 85
aú 84
ág 84
ew 82
sg 82
bó 81
zi 81
fá 80
ht 80
áb 80
éd 80
íg 80
ds 78
sb 78
Ab 77
Ai 77
ñe 77
Ot 76
íp 75
Er 74
We 74
uñ 74
Dr 73
Em 72
Ya 72
It 71
ax 71
XI 70
pp 70
zq 70
ks 69
ms 69
sn 69
ix 68
Ir 67
aw 67
hr 67
nl 67
pá 67
tc 67
ód 67
Ll 66
Má 66
fú 66
ff 65
ft 65
Av 64
XV 64
dá 64
wn 64
ze 64
Za 63
Ol 62
eí 62
nh 62
tm 62
ys 62
Ko 61
rú 61
áx 61
uá 60
pí 59
zá 59
ém 59
úa 59
dq 58
dy 57
uq 57
yl 57
Ej 56
Ke 56
bá 56
hó 56
Ig 55
Im 55
Vo 55
Wo 55
bé 55
tz 55
Ec 54
Ur 54
lk 54
Oc 53
gü 53
tú 53
ux 53
vó 53
ót 52
fó 51
Ob 50
pé 50
Có 49
íb 49
üe 49
Ay 48
yn 48
uk 47
my 46
sv 46
zz 46
óc 46
cm 45
sá 45
wo 45
XX 44
aa 44
ii 44
xo 44
Ph 43
ek 43
rj 43
yr 43
éf 43
Ib 42
Os 42
Rí 42
gm 42
hl 42
Án 42
ír 42
by 41
gt 41
ñó 41
ku 40
FC 39
Gl 39
fé 39
kl 39
ky 39
oñ 39
úc 39
AS 38
IV 38
bú 38
dw 38
yc 38
yp 38
há 37
lz 37
9: 36
:9 36
aé 36
dd 36
gá 36
Cá 35
dv 35
ln 35
sú 35
tn 35
xu 35
yt 35
's 34
hy 34
ih 34
r. 34
ég 34
C. 33
DE 33
ES 33
Ev 33
Op 33
c. 33
cy 33
dg 33
zg 33
EE 32
SS 32
Yu 32
hm 32
nb 32
xe 32
Ah 31
EC 31
IX 31
éi 31
óf 31
SA 30
rh 30
uó 30
Kr 29
Mc 29
RA 29
Sm 29
tw 29
ws 29
Ál 29
Ku 28
dl 28
gg 28
Áf 28
ád 28
AC 27
Ló 27
TV 27
cs 27
cú 27
gs 27
vá 27
zh 27
A. 26
E. 26
IN 26
ON 26
PP 26
Pé 26
RE 26
Wh 26
Ye 26
Ze 26
bb 26
d' 26
hú 26
lh 26
ww 26
ym 26
ñi 26
BA 25
Dí 25
EN 25
Ji 25
Zo 25
hé 25
ív 25
íz 25
AM 24
AN 24
Ae 24
CD 24
ER 24
Fú 24
ID 24
Il 24
PS 24
TA 24
iy 24
sr 24
sy 24
És 24
AD 23
Az 23
Jr 23
NA 23
s. 23
xh 23
yd 23
áv 23
íe 23
AR 22
CE 22
CO 22
Cy 22
DR 22
Zi 22
Zu 22
dh 22
gd 22
oí 22
yi 22
Él 22
áu 22
Ea 21
Eg 21
FA 21
MI 21
NE 21
PC 21
Sá 21
dú 21
íl 21
AL 20
Af 20
CA 20
IA 20
IC 20
NI 20
On 20
TE 20
kh 20
kk 20
n. 20
wl 20
ái 20
Añ 19
MS 19
S. 19
ST 19
UU 19
hc 19
ml 19
sw 19
éa 19
'9 18
Hé 18
IS 18
MA 18
My 18
PA 18
Sw 18
Só 18
U. 18
UE 18
US 18
áz 18
.c 17
Aq 17
CI 17
Et 17
Hy 17
IB 17
Io 17
LA 17
Ly 17
NB 17
NC 17
SC 17
SE 17
bd 17
lú 17
yw 17
úr 17
AP 16
Aé 16
Bá 16
EP 16
Nú 16
Om 16
P. 16
Ps 16
RI 16
SD 16
Ty 16
Us 16
bm 16
dj 16
áq 16
íq 16
úp 16
'' 15
AA 15
CC 15
D. 15
DA 15
DN 15
DS 15
IP 15
IR 15
Kn 15
OS 15
PI 15
RO 15
Ry 15
SI 15
SO 15
UN 15
VE 15
bc 15
xq 15
ób 15
.U 14
BC 14
Bé 14
CB 14
ED 14
EL 14
H9 14
Mú 14
PR 14
Sy 14
Ul 14
tp 14
Ár 14
.A 13
Aw 13
BB 13
CR 13
DC 13
EF 13
ET 13
Ei 13
Ep 13
FI 13
Iz 13
NG 13
PD 13
Pú 13
SP 13
VA 13
Ví 13
dn 13
kg 13
rw 13
w. 13
éu 13
úñ 13
.C 12
EM 12
GB 12
Gü 12
NH 12
Oa 12
Oe 12
RC 12
Sk 12
Sl 12
TI 12
Ut 12
Xi 12
bv 12
dt 12
eá 12
gf 12
gy 12
kt 12
np 12
sz 12
áj 12
èr 12
.e 11
AB 11
AF 11
BS 11
CP 11
DV 11
EU 11
Fé 11
Hz 11
IE 11
Id 11
Lí 11
NO 11
Ná 11
O' 11
Oj 11
R9 11
TO 11
Tl 11
Tw 11
UR 11
Zh 11
fs 11
hw 11
já 11
t. 11
tx 11
uh 11
vr 11
vy 11
xó 11
yb 11
ör 11
9' 10
9/ 10
AE 10
BI 10
BR 10
CH 10
CN 10
CV 10
DO 10
HD 10
L. 10
LO 10
MT 10
Mí 10
Mó 10
O. 10
OL 10
Ow 10
P9 10
Pá 10
R. 10
Té 10
Tú 10
Ub 10
Vu 10
Wr 10
a. 10
iP 10
iè 10
l' 10
nw 10
nç 10
o. 10
tg 10
zú 10
év 10
úe 10
A9 9
AI 9
AT 9
AV 9
Aa 9
B. 9
BL 9
BT 9
BV 9
CF 9
CW 9
Cé 9
DI 9
Dy 9
E9 9
EA 9
FE 9
Fá 9
GA 9
Gh 9
I. 9
IT 9
Iv 9
J. 9
M. 9
N. 9
NU 9
OE 9
OR 9
Od 9
Oh 9
Sq 9
Sv 9
Sí 9
T. 9
Wu 9
bf 9
bn 9
cq 9
gk 9
lw 9
m. 9
nx 9
oé 9
pn 9
uu 9
yf 9
ão 9
éb 9
ée 9
9t 8
:/ 8
Ak 8
BM 8
CU 8
Ef 8
F. 8
GP 8
Gé 8
Gó 8
Ic 8
Já 8
Kh 8
LC 8
MP 8
NT 8
OC 8
OM 8
OT 8
PE 8
PN 8
Qa 8
RM 8
RS 8
S9 8
Sr 8
Sé 8
TC 8
UC 8
VD 8
W. 8
WW 8
Xa 8
ZA 8
db 8
dc 8
hâ 8
py 8
tk 8
tv 8
vc 8
vs 8
zk 8
zm 8
zn 8
zt 8
éj 8
úd 8
'A 7
.S 7
.m 7
9F 7
AG 7
AZ 7
BG 7
CT 7
Eq 7
GM 7
HC 7
HM 7
HT 7
K. 7
Kl 7
L' 7
LM 7
LP 7
MO 7
NS 7
Oi 7
Ok 7
Ox 7
PL 7
PU 7
RP 7
SM 7
SN 7
UL 7
Uc 7
Vl 7
WA 7
Zú 7
gb 7
hs 7
iT 7
kr 7
ká 7
lj 7
m² 7
oá 7
tf 7
wt 7
xf 7
xy 7
yg 7
yy 7
yá 7
áh 7
ön 7
úo 7
üi 7
+9 6
.M 6
.O 6
.T 6
.a 6
.o 6
// 6
/9 6
9D 6
AH 6
AX 6
By 6
CS 6
Cn 6
DH 6
FM 6
FR 6
HS 6
IO 6
Ky 6
LG 6
LL 6
MB 6
ME 6
MH 6
MV 6
MW 6
ND 6
OO 6
PO 6
Sã 6
TS 6
Tá 6
UP 6
UT 6
Vá 6
WC 6
aó 6
cL 6
eú 6
fg 6
gz 6
hb 6
iú 6
ić 6
jí 6
mt 6
p: 6
wk 6
yú 6
zb 6
zs 6
Áv 6
Ós 6
áe 6
ât 6
ça 6
ço 6
öl 6
úz 6
.D 5
.n 5
/w 5
9A 5
9B 5
9m 5
9s 5
9v 5
AU 5
Aú 5
B9 5
BP 5
Bh 5
C9 5
CJ 5
CL 5
Cí 5
Cú 5
DM 5
Dh 5
EB 5
EG 5
EO 5
Ee 5
Ey 5
FS 5
Fí 5
Fó 5
GH 5
GL 5
HO 5
IM 5
LE 5
LI 5
M9 5
Mü 5
NF 5
NV 5
NZ 5
Nó 5
Ou 5
Pt 5
Py 5
Pí 5
RB 5
Rh 5
SB 5
SL 5
Tí 5
UA 5
UD 5
UV 5
bh 5
cC 5
cD 5
d. 5
hv 5
ià 5
kn 5
mc 5
pm 5
rx 5
uT 5
vk 5
wb 5
wh 5
wr 5
wá 5
x9 5
yS 5
yk 5
yé 5
zl 5
Ág 5
áñ 5
èn 5
ès 5
ün 5
ür 5
üs 5
'O 4
'a 4
.h 4
9N 4
9O 4
9k 4
9x 4
== 4
BE 4
BH 4
Bí 4
CG 4
Cô 4
D9 4
DK 4
DL 4
DP 4
DT 4
DU 4
Dá 4
Dé 4
EI 4
EV 4
Eb 4
F9 4
FU 4
G. 4
GE 4
Gm 4
Gy 4
H. 4
HG 4
HP 4
IF 4
IH 4
Iñ 4
LN 4
Lá 4
MC 4
MD 4
MM 4
Mr 4
NW 4
OP 4
Ov 4
PK 4
PM 4
QU 4
RD 4
RF 4
RN 4
RR 4
RT 4
RU 4
RV 4
Ré 4
SG 4
SU 4
Sn 4
T9 4
TF 4
TL 4
TR 4
Ud 4
Uz 4
VN 4
VP 4
Vé 4
WE 4
WH 4
X. 4
Xu 4
Yi 4
Ys 4
a' 4
cB 4
cK 4
cd 4
df 4
dz 4
e. 4
fm 4
fy 4
gw 4
gè 4
hō 4
iC 4
iF 4
iw 4
k9 4
kf 4
kw 4
mf 4
mr 4
mw 4
oS 4
qa 4
rè 4
rö 4
vd 4
vl 4
vn 4
wc 4
wm 4
wy 4
xí 4
zy 4
àl 4
ân 4
ñá 4
ôt 4
üc 4
ül 4
üí 4
ος 4
'C 3
'N 3
'e 3
'm 3
.B 3
.E 3
.F 3
.I 3
.K 3
.P 3
.d 3
.p 3
9P 3
9h 3
AK 3
AO 3
Ax 3
BN 3
Bj 3
Bt 3
CM 3
Cd 3
DG 3
Dn 3
Dw 3
Eh 3
Ek 3
Ez 3
FB 3
FF 3
FG 3
FL 3
GO 3
GR 3
GT 3
Gw 3
Gá 3
Gö 3
HE 3
HF 3
HL 3
Hí 3
Hú 3
IG 3
IL 3
IU 3
If 3
Ih 3
Ip 3
Iq 3
Iw 3
Ix 3
KS 3
Ká 3
L9 3
Lt 3
ML 3
MN 3
MU 3
Mä 3
N9 3
NN 3
NP 3
Né 3
Nö 3
Og 3
PF 3
PG 3
PJ 3
PT 3
PV 3
Rá 3
Rü 3
Sz 3
Sú 3
TD 3
TN 3
TP 3
TT 3
Ts 3
Tx 3
Tü 3
UG 3
Ug 3
Um 3
Up 3
V. 3
V9 3
VH 3
VS 3
Wy 3
X9 3
Xb 3
Xo 3
YA 3
YN 3
Zw 3
aç 3
b' 3
bp 3
cz 3
dk 3
fq 3
gp 3
hd 3
hh 3
hk 3
hp 3
js 3
jø 3
l. 3
lx 3
lü 3
md 3
mg 3
må 3
n' 3
nB 3
nE 3
nG 3
oI 3
oë 3
p. 3
rø 3
rü 3
s/ 3
t' 3
td 3
tj 3
tö 3
uw 3
uð 3
v9 3
wf 3
wp 3
xl 3
yh 3
yz 3
zp 3
zí 3
Ét 3
Íg 3
Óp 3
ål 3
éz 3
íx 3
öm 3
ør 3
úh 3
ōs 3
œu 3
κα 3
ρο 3
&l 2
'B 2
'D 2
'W 2
'l 2
'v 2
'œ 2
.G 2
.L 2
.R 2
.W 2
.X 2
.f 2
.l 2
.r 2
.s 2
.x 2
.ç 2
/d 2
/i 2
/k 2
/s 2
9C 2
9E 2
9G 2
9M 2
9X 2
9c 2
9l 2
9o 2
AY 2
BJ 2
BU 2
Bú 2
CK 2
CX 2
Cs 2
Ct 2
DB 2
Dz 2
Dó 2
Dö 2
Dú 2
EZ 2
FH 2
FN 2
FP 2
FX 2
GC 2
GI 2
GN 2
GV 2
Gs 2
Hö 2
IJ 2
JA 2
JE 2
JI 2
JJ 2
JK 2
JO 2
Jä 2
Jó 2
Jõ 2
KD 2
KI 2
KL 2
Km 2
Kó 2
Kö 2
Kō 2
LB 2
LD 2
LF 2
LR 2
LS 2
LT 2
LX 2
Lé 2
MG 2
MR 2
Ms 2
NK 2
NM 2
NR 2
NX 2
Nd 2
Ng 2
Nj 2
Ny 2
O9 2
OA 2
OB 2
OD 2
OF 2
OG 2
OH 2
OI 2
Oy 2
Oz 2
Oñ 2
PW 2
Pb 2
Pó 2
Qi 2
Qo 2
Rt 2
Rú 2
SF 2
SR 2
SV 2
SY 2
Sō 2
TG 2
TH 2
TU 2
UH 2
VR 2
Vä 2
WF 2
WL 2
XB 2
XL 2
XT 2
Xp 2
Y. 2
YU 2
Zy 2
Zá 2
`` 2
aD 2
aï 2
aü 2
b. 2
bč 2
bō 2
cA 2
cG 2
cM 2
cx 2
dà 2
eB 2
eT 2
f. 2
fn 2
g. 2
gx 2
h. 2
hC 2
hP 2
hf 2
hř 2
iM 2
iU 2
ií 2
ič 2
jd 2
jk 2
jp 2
jū 2
kB 2
kí 2
kó 2
kö 2
là 2
lä 2
lò 2
lö 2
lø 2
m/ 2
mv 2
mè 2
mə 2
nC 2
nö 2
nǚ 2
nɔ 2
pH 2
pb 2
pd 2
pf 2
pg 2
pz 2
qi 2
rL 2
rà 2
rã 2
ræ 2
rç 2
r� 2
s9 2
ső 2
t; 2
tō 2
u' 2
uM 2
uş 2
v. 2
x. 2
xm 2
xá 2
xé 2
y. 2
y/ 2
yv 2
yx 2
yū 2
zw 2
Ám 2
Át 2
Éc 2
Éf 2
Éx 2
Ín 2
Îl 2
Ób 2
Ól 2
Úl 2
àn 2
àr 2
âl 2
äk 2
äm 2
är 2
äs 2
çu 2
èg 2
èm 2
éq 2
íj 2
ît 2
ój 2
óo 2
ów 2
õh 2
ös 2
øn 2
új 2
üb 2
üé 2
či 2
Đu 2
ře 2
ši 2
əs 2
αλ 2
ια 2
ιλ 2
λι 2
λο 2
μm 2
ον 2
όρ 2
ви 2
ор 2
ات 2
بل 2
下第 2
天下 2
第一 2
E 2
L 2
�� 2
"R 1
'E 1
'I 1
'K 1
'M 1
'U 1
'c 1
'h 1
'i 1
't 1
'u 1
-( 1
-) 1
-E 1
-h 1
.N 1
.g 1
.i 1
.j 1
.t 1
.u 1
.v 1
/C 1
/L 1
/c 1
/r 1
/t 1
9" 1
9S 1
9a 1
9b 1
9e 1
9i 1
9p 1
9y 1
:) 1
:- 1
;- 1
;r 1
=" 1
AJ 1
Aj 1
Ao 1
AÑ 1
AÚ 1
Aí 1
Ağ 1
BK 1
BO 1
Bx 1
Bó 1
Bü 1
Bœ 1
C' 1
CQ 1
CY 1
Cc 1
Cf 1
Cz 1
Cè 1
D' 1
DD 1
DF 1
DJ 1
Dc 1
Dj 1
Dm 1
DÍ 1
Dà 1
Dô 1
Dü 1
EJ 1
EK 1
EW 1
EX 1
FD 1
FK 1
FO 1
FQ 1
FT 1
FV 1
Fb 1
Fh 1
Fè 1
Fë 1
GG 1
GK 1
GU 1
Gn 1
GÜ 1
Gä 1
HA 1
HB 1
HI 1
HR 1
HU 1
Hl 1
Hn 1
Hs 1
Há 1
IW 1
IZ 1
Ik 1
Iu 1
IÁ 1
IÑ 1
IÓ 1
Ió 1
JD 1
JG 1
JN 1
JP 1
JS 1
Jv 1
Jé 1
Jú 1
Jü 1
K' 1
K- 1
KA 1
KC 1
KE 1
KF 1
KM 1
KN 1
KO 1
KV 1
KY 1
Kf 1
Kw 1
KÖ 1
Kü 1
LQ 1
LV 1
LY 1
LZ 1
Lh 1
Lm 1
Ls 1
LÍ 1
Lä 1
MF 1
MJ 1
MK 1
MZ 1
Ml 1
MÉ 1
Mà 1
Må 1
Mö 1
NY 1
Nm 1
Nr 1
Ns 1
Nà 1
Ní 1
Nī 1
OJ 1
OU 1
OV 1
OW 1
OX 1
OY 1
OZ 1
Oo 1
PH 1
PQ 1
Pc 1
Pf 1
Pm 1
Pà 1
Q. 1
QC 1
QL 1
QM 1
RG 1
RL 1
RW 1
RY 1
Rb 1
Rc 1
Rs 1
Rä 1
Ró 1
SH 1
SJ 1
SK 1
SQ 1
SX 1
Sj 1
Ss 1
Sâ 1
Sö 1
TB 1
TM 1
Tc 1
Tz 1
Tâ 1
Tı 1
Tō 1
TΔ 1
U9 1
UB 1
UI 1
UJ 1
UK 1
UM 1
UO 1
UQ 1
UX 1
UY 1
Uv 1
Ux 1
VB 1
VC 1
VO 1
VT 1
VU 1
Vf 1
Vs 1
Vå 1
Væ 1
Vö 1
WD 1
WI 1
WK 1
WN 1
WO 1
WP 1
WR 1
WS 1
WT 1
Ws 1
Wö 1
Wü 1
XA 1
XC 1
XD 1
XF 1
XS 1
Xe 1
Xf 1
Xh 1
Xv 1
Xī 1
YC 1
YE 1
YO 1
YR 1
YT 1
Yb 1
Ym 1
Yp 1
Yá 1
Z9 1
ZE 1
ZS 1
ZT 1
ZU 1
Zd 1
Zv 1
Zí 1
Zö 1
_c 1
a- 1
a9 1
aA 1
aC 1
aG 1
aK 1
aM 1
aN 1
aZ 1
aî 1
að 1
ađ 1
ağ 1
ał 1
aš 1
bC 1
bH 1
bK 1
bg 1
bw 1
bz 1
bà 1
bö 1
bø 1
bü 1
bš 1
c' 1
cI 1
cQ 1
cV 1
cf 1
cv 1
cæ 1
dI 1
dL 1
dS 1
dp 1
dô 1
dā 1
dē 1
dō 1
dŵ 1
e9 1
e= 1
eC 1
eF 1
eI 1
eJ 1
eO 1
eQ 1
eS 1
eV 1
eW 1
eX 1
eß 1
eà 1
eé 1
eð 1
eü 1
f9 1
fL 1
fb 1
fc 1
fj 1
fk 1
fx 1
fâ 1
fü 1
gc 1
gù 1
gō 1
h- 1
h/ 1
hK 1
hM 1
hj 1
hq 1
hz 1
hè 1
hü 1
hā 1
hū 1
iD 1
iL 1
iR 1
iS 1
iã 1
iç 1
ið 1
iò 1
iş 1
j. 1
jl 1
jn 1
jw 1
jy 1
jö 1
jú 1
k' 1
kD 1
kF 1
kJ 1
kb 1
kc 1
kx 1
kä 1
l9 1
lI 1
lR 1
lâ 1
lè 1
lù 1
lı 1
mA 1
mG 1
mh 1
mj 1
mk 1
mq 1
mx 1
mà 1
mõ 1
mö 1
mû 1
mü 1
n/ 1
nP 1
n_ 1
nà 1
nä 1
nè 1
nê 1
nü 1
ný 1
nı 1
nō 1
nů 1
o! 1
oA 1
oB 1
oC 1
oK 1
oN 1
oO 1
oã 1
oç 1
oî 1
oï 1
oó 1
oğ 1
p9 1
pB 1
pK 1
pM 1
pR 1
pj 1
pk 1
pè 1
pù 1
q' 1
qc 1
qo 1
r9 1
rA 1
rD 1
rP 1
rV 1
râ 1
rå 1
rð 1
s' 1
sP 1
sR 1
sW 1
sj 1
sà 1
t/ 1
tC 1
tL 1
tW 1
tū 1
u. 1
u/ 1
uG 1
uà 1
uè 1
uþ 1
už 1
vg 1
vå 1
væ 1
vö 1
vý 1
wg 1
wu 1
wā 1
xB 1
xb 1
xd 1
xr 1
xs 1
xì 1
xò 1
yC 1
yF 1
yJ 1
yM 1
yj 1
yè 1
yí 1
yš 1
z. 1
zM 1
zW 1
zj 1
zr 1
zè 1
zô 1
zö 1
zī 1
ző 1
ÁN 1
Áy 1
Ås 1
Èz 1
ÉX 1
Éb 1
Éi 1
Ép 1
Éq 1
Ér 1
Év 1
ÍA 1
ÍT 1
Íc 1
ÑE 1
ÑO 1
Ña 1
Ñu 1
ÓN 1
Ór 1
Öl 1
Ör 1
Ös 1
ÚN 1
Új 1
Ún 1
ÜE 1
Üb 1
ße 1
às 1
ák 1
áo 1
áy 1
âo 1
äd 1
äf 1
äi 1
än 1
äu 1
äv 1
åg 1
åk 1
ån 1
år 1
æc 1
æd 1
æn 1
ær 1
æð 1
çl 1
èl 1
èt 1
éo 1
ëa 1
ëf 1
ën 1
ìn 1
ík 1
íu 1
íñ 1
íα 1
ïe 1
ïf 1
ða 1
ðb 1
ði 1
ðr 1
ðu 1
ñ9 1
ñt 1
ñu 1
ñé 1
òn 1
óa 1
óq 1
óy 1
óz 1
óð 1
óñ 1
óς 1
ôm 1
ôn 1
õe 1
öf 1
öh 1
öp 1
öt 1
öy 1
øk 1
øs 1
øu 1
øy 1
ùb 1
úf 1
úg 1
úq 1
úy 1
ûm 1
üa 1
üg 1
üm 1
üt 1
ýd 1
þr 1
ām 1
ās 1
āz 1
ći 1
čk 1
čí 1
ēm 1
ğa 1
ğd 1
ğl 1
ġd 1
īn 1
īt 1
İs 1
ık 1
ıl 1
Ła 1
Łu 1
łi 1
ōc 1
ōj 1
ōn 1
őb 1
őn 1
Śi 1
Št 1
Šu 1
šć 1
ūn 1
ūḥ 1
ůf 1
ŵr 1
ži 1
ǚx 1
ɔr 1
ɔʂ 1
ɛa 1
ΒΖ 1
Γα 1
Γρ 1
ΔG 1
ΔH 1
ΔS 1
ΖΒ 1
Κα 1
Νι 1
Φι 1
Φό 1
έλ 1
ίο 1
ίτ 1
αί 1
αδ 1
αρ 1
αυ 1
αφ 1
γο 1
δί 1
ε9 1
ελ 1
ηγ 1
ηφ 1
ικ 1
κη 1
λí 1
λó 1
λλ 1
λτ 1
μο 1
μπ 1
νο 1
οκ 1
ορ 1
ου 1
οῦ 1
πή 1
πε 1
ρη 1
ρκ 1
ρμ 1
ρᾶ 1
σα 1
τε 1
τη 1
το 1
υλ 1
υρ 1
φέ 1
φι 1
φυ 1
φό 1
АЗ 1
Ап 1
Иг 1
Ко 1
Кр 1
ПО 1
Ст 1
Фё 1
ав 1
ат 1
ге 1
гн 1
до 1
ев 1
ей 1
ие 1
ий 1
ин 1
ит 1
ич 1
ки 1
на 1
не 1
нс 1
ог 1
по 1
рА 1
ра 1
ри 1
ск 1
ти 1
тн 1
тр 1
ёд 1
ְר 1
ֵפ 1
ָה 1
טְ 1
סע 1
ער 1
פָ 1
רֵ 1
اء 1
اب 1
ال 1
ام 1
ان 1
بن 1
تا 1
تم 1
تو 1
جب 1
حا 1
حة 1
دا 1
را 1
سي 1
طر 1
غد 1
فت 1
لب 1
لس 1
لط 1
ما 1
مس 1
مف 1
نا 1
وح 1
ंग 1
और 1
गा 1
बा 1
भा 1
रं 1
वि 1
ाग 1
ाद 1
ाब 1
िभ 1
ভৌ 1
মি 1
মী 1
মৌ 1
সু 1
িক 1
ুম 1
ৌম 1
ৌস 1
ḥa 1
Ἀρ 1
ᾶς 1
ぎぐ 1
上海 1
申花 1
雄关 1
D 1
G 1
S 1
�n 1
32
case 56548
det 51438
punct 40104
nmod 33120
obl 20916
amod 19460
conj 14420
root 13477
nsubj 13214
obj 11448
cc 11100
mark 9681
advmod 9517
appos 7524
iobj 6239
flat 6110
nummod 6054
cop 5274
acl 4722
acl:relcl 4478
advcl 3547
aux 3483
fixed 2365
aux:pass 1578
parataxis 1370
ccomp 1320
xcomp 1188
dep 1021
nsubj:pass 1006
csubj 567
compound 357
csubj:pass 5
component {
name: "lookahead"
transition_system {
registered_name: "shift-only"
parameters {
key: "left_to_right"
value: "false"
}
}
fixed_feature {
name: "char"
fml: "input(-1).char input.char input(1).char"
embedding_dim: 32
vocabulary_size: 119
size: 3
}
fixed_feature {
name: "char-bigram"
fml: "input.char-bigram"
embedding_dim: 32
vocabulary_size: 1158
size: 1
}
network_unit {
registered_name: "wrapped_units.LayerNormBasicLSTMNetwork"
parameters {
key: "hidden_layer_sizes"
value: "256"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
num_actions: 1
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
component {
name: "segmenter"
transition_system {
registered_name: "binary-segment-transitions"
}
resource {
name: "suffix-table"
part {
file_pattern: "suffix-table"
}
}
linked_feature {
name: "lookahead"
fml: "input.focus stack.focus"
embedding_dim: 32
size: 2
source_component: "lookahead"
source_translator: "reverse-token"
source_layer: "state_h_0"
}
network_unit {
registered_name: "wrapped_units.LayerNormBasicLSTMNetwork"
parameters {
key: "hidden_layer_sizes"
value: "128"
}
}
backend {
registered_name: "SyntaxNetComponent"
}
num_actions: 2
component_builder {
registered_name: "DynamicComponentBuilder"
}
}
This diff is collapsed.
This diff is collapsed.
......@@ -6,70 +6,94 @@
"metadata": {
"collapsed": false,
"deletable": true,
"editable": true
"editable": true,
"scrolled": false
},
"outputs": [],
"source": [
"import os\n",
"import ipywidgets as widgets\n",
"import tensorflow as tf\n",
"import uuid\n",
"from IPython import display\n",
"from dragnn.protos import spec_pb2\n",
"from dragnn.python import graph_builder\n",
"from dragnn.python import spec_builder\n",
"from dragnn.python import load_dragnn_cc_impl # This loads the actual op definitions\n",
"from dragnn.python import render_parse_tree_graphviz\n",
"from dragnn.python import visualization\n",
"from google.protobuf import text_format\n",
"from syntaxnet import load_parser_ops # This loads the actual op definitions\n",
"from syntaxnet import sentence_pb2\n",
"from syntaxnet.ops import gen_parser_ops\n",
"from tensorflow.python.platform import tf_logging as logging\n",
"\n",
"# Read the master spec\n",
"master_spec = spec_pb2.MasterSpec()\n",
"with open(\"data/master_spec_es.prototext\", \"r\") as f:\n",
" text_format.Merge(f.read(), master_spec)\n",
"def load_model(base_dir, master_spec_name, checkpoint_name):\n",
" # Read the master spec\n",
" master_spec = spec_pb2.MasterSpec()\n",
" with open(os.path.join(base_dir, master_spec_name), \"r\") as f:\n",
" text_format.Merge(f.read(), master_spec)\n",
" spec_builder.complete_master_spec(master_spec, None, base_dir)\n",
" logging.set_verbosity(logging.WARN) # Turn off TensorFlow spam.\n",
"\n",
" # Initialize a graph\n",
" graph = tf.Graph()\n",
" with graph.as_default():\n",
" hyperparam_config = spec_pb2.GridPoint()\n",
" builder = graph_builder.MasterBuilder(master_spec, hyperparam_config)\n",
" # This is the component that will annotate test sentences.\n",
" annotator = builder.add_annotation(enable_tracing=True)\n",
" builder.add_saver() # \"Savers\" can save and load models; here, we're only going to load.\n",
"\n",
"logging.set_verbosity(logging.WARN) # Turn off TensorFlow spam.\n",
" sess = tf.Session(graph=graph)\n",
" with graph.as_default():\n",
" sess.run(tf.global_variables_initializer())\n",
" sess.run('save/restore_all', {'save/Const:0': os.path.join(base_dir, checkpoint_name)})\n",
" \n",
" def annotate_sentence(sentence):\n",
" with graph.as_default():\n",
" return sess.run([annotator['annotations'], annotator['traces']],\n",
" feed_dict={annotator['input_batch']: [sentence]})\n",
" return annotate_sentence\n",
"\n",
"# Initialize a graph\n",
"graph = tf.Graph()\n",
"with graph.as_default():\n",
" hyperparam_config = spec_pb2.GridPoint()\n",
" builder = graph_builder.MasterBuilder(master_spec, hyperparam_config)\n",
" # This is the component that will annotate test sentences.\n",
" annotator = builder.add_annotation(enable_tracing=True)\n",
" builder.add_saver() # \"Savers\" can save and load models; here, we're only going to load."
"segmenter_model = load_model(\"data/es/segmenter\", \"spec.textproto\", \"checkpoint\")\n",
"parser_model = load_model(\"data/es\", \"parser_spec.textproto\", \"checkpoint\")"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": false
"collapsed": false,
"deletable": true,
"editable": true
},
"outputs": [],
"source": [
"sess = tf.Session(graph=graph)\n",
"with graph.as_default():\n",
" sess.run(tf.global_variables_initializer())\n",
" sess.run('save/restore_all', {'save/Const:0': \"data/mini-spanish.checkpoint\"})\n",
"\n",
"def annotate_text(text):\n",
" sentence = sentence_pb2.Sentence(\n",
" text=text,\n",
" token=[sentence_pb2.Token(word=word, start=-1, end=-1) for word in text.split()]\n",
" )\n",
" with graph.as_default():\n",
" annotations, traces = sess.run([annotator['annotations'], annotator['traces']],\n",
" feed_dict={annotator['input_batch']: [sentence.SerializeToString()]})\n",
" assert len(annotations) == 1\n",
" assert len(traces) == 1\n",
" return sentence_pb2.Sentence.FromString(annotations[0]), traces[0]\n",
"\n",
" # preprocess\n",
" with tf.Session(graph=tf.Graph()) as tmp_session:\n",
" char_input = gen_parser_ops.char_token_generator([sentence.SerializeToString()])\n",
" preprocessed = tmp_session.run(char_input)[0]\n",
" segmented, _ = segmenter_model(preprocessed)\n",
"\n",
" annotations, traces = parser_model(segmented[0])\n",
" assert len(annotations) == 1\n",
" assert len(traces) == 1\n",
" return sentence_pb2.Sentence.FromString(annotations[0]), traces[0]\n",
"annotate_text(\"casa\"); None # just make sure it works"
]
},
{
"cell_type": "markdown",
"metadata": {},
"metadata": {
"deletable": true,
"editable": true
},
"source": [
"# Interactive trace explorer\n",
"Run the cell below, and then enter text in the interactive widget."
......@@ -79,7 +103,9 @@
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": false
"collapsed": false,
"deletable": true,
"editable": true
},
"outputs": [],
"source": [
......@@ -102,7 +128,10 @@
},
{
"cell_type": "markdown",
"metadata": {},
"metadata": {
"deletable": true,
"editable": true
},
"source": [
"# Interactive parse tree explorer\n",
"Run the cell below, and then enter text in the interactive widget."
......@@ -112,7 +141,9 @@
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": false
"collapsed": false,
"deletable": true,
"editable": true
},
"outputs": [],
"source": [
......@@ -125,7 +156,10 @@
" def handle_submit(sender):\n",
" del sender # unused\n",
" parse_tree, trace = annotate_text(text.value)\n",
" html.value = render_parse_tree_graphviz.parse_tree_graph(parse_tree)\n",
" html.value = u\"\"\"\n",
" <div style=\"max-width: 100%\">{}</div>\n",
" <style type=\"text/css\">svg {{ max-width: 100%; }}</style>\n",
" \"\"\".format(render_parse_tree_graphviz.parse_tree_graph(parse_tree))\n",
"\n",
" text.on_submit(handle_submit)\n",
"_parse_tree_explorer()"
......
......@@ -11,8 +11,7 @@ Please see our [paper](paper.pdf) more technical details about the model.
* Install SyntaxNet/DRAGNN following the install instructions.
* Download the models [here](https://drive.google.com/file/d/0BxpbZGYVZsEeSFdrUnBNMUp1YzQ/view?usp=sharing)
* Download the contest [data data and
tools](https://lindat.mff.cuni.cz/repository/xmlui/handle/11234/1-1976]).
* Download the contest [data and tools](http://universaldependencies.org/conll17/)
* Run the baseline_eval.py to run the pre-trained tokenizer and evaluate on
the dev set.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment