Add files using upload-large-folder tool
Browse files- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.06.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.102.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.104.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.107.conllu +0 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.119.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.12.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.120.conllu +0 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.120.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.19.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.24.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.25.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.37.conllu +0 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.51.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.61.conllu +0 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.71.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.87.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.88.conllu +0 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.88.conllu.eval +13 -0
- runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/mappings.pkl +3 -0
- runs/final_run-seed=1.log +307 -0
- runs/final_run.log +306 -0
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.06.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 95.55%
|
| 5 |
+
XPOS: 83.85%
|
| 6 |
+
UFeats: 86.15%
|
| 7 |
+
AllTags: 80.56%
|
| 8 |
+
Lemmas: 82.32%
|
| 9 |
+
UAS: 73.80%
|
| 10 |
+
LAS: 64.54%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.102.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.78%
|
| 5 |
+
XPOS: 90.91%
|
| 6 |
+
UFeats: 92.86%
|
| 7 |
+
AllTags: 90.23%
|
| 8 |
+
Lemmas: 91.14%
|
| 9 |
+
UAS: 82.45%
|
| 10 |
+
LAS: 75.89%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.104.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.75%
|
| 5 |
+
XPOS: 90.99%
|
| 6 |
+
UFeats: 92.86%
|
| 7 |
+
AllTags: 90.24%
|
| 8 |
+
Lemmas: 91.14%
|
| 9 |
+
UAS: 82.51%
|
| 10 |
+
LAS: 75.99%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.107.conllu
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.119.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.78%
|
| 5 |
+
XPOS: 90.97%
|
| 6 |
+
UFeats: 92.90%
|
| 7 |
+
AllTags: 90.29%
|
| 8 |
+
Lemmas: 91.15%
|
| 9 |
+
UAS: 82.49%
|
| 10 |
+
LAS: 76.01%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.12.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 95.92%
|
| 5 |
+
XPOS: 84.55%
|
| 6 |
+
UFeats: 86.83%
|
| 7 |
+
AllTags: 81.09%
|
| 8 |
+
Lemmas: 83.84%
|
| 9 |
+
UAS: 76.18%
|
| 10 |
+
LAS: 67.70%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.120.conllu
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.120.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.78%
|
| 5 |
+
XPOS: 90.97%
|
| 6 |
+
UFeats: 92.90%
|
| 7 |
+
AllTags: 90.29%
|
| 8 |
+
Lemmas: 91.15%
|
| 9 |
+
UAS: 82.49%
|
| 10 |
+
LAS: 76.01%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.19.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 95.94%
|
| 5 |
+
XPOS: 84.50%
|
| 6 |
+
UFeats: 86.87%
|
| 7 |
+
AllTags: 81.21%
|
| 8 |
+
Lemmas: 84.68%
|
| 9 |
+
UAS: 77.01%
|
| 10 |
+
LAS: 68.61%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.24.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.60%
|
| 5 |
+
XPOS: 88.48%
|
| 6 |
+
UFeats: 90.77%
|
| 7 |
+
AllTags: 86.45%
|
| 8 |
+
Lemmas: 87.96%
|
| 9 |
+
UAS: 79.42%
|
| 10 |
+
LAS: 71.96%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.25.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.46%
|
| 5 |
+
XPOS: 88.36%
|
| 6 |
+
UFeats: 90.76%
|
| 7 |
+
AllTags: 86.35%
|
| 8 |
+
Lemmas: 86.38%
|
| 9 |
+
UAS: 79.85%
|
| 10 |
+
LAS: 72.37%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.37.conllu
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.51.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.91%
|
| 5 |
+
XPOS: 90.75%
|
| 6 |
+
UFeats: 92.64%
|
| 7 |
+
AllTags: 89.86%
|
| 8 |
+
Lemmas: 90.44%
|
| 9 |
+
UAS: 81.85%
|
| 10 |
+
LAS: 75.11%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.61.conllu
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.71.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.78%
|
| 5 |
+
XPOS: 90.93%
|
| 6 |
+
UFeats: 92.73%
|
| 7 |
+
AllTags: 90.10%
|
| 8 |
+
Lemmas: 90.86%
|
| 9 |
+
UAS: 82.31%
|
| 10 |
+
LAS: 75.79%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.87.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.73%
|
| 5 |
+
XPOS: 91.03%
|
| 6 |
+
UFeats: 92.89%
|
| 7 |
+
AllTags: 90.31%
|
| 8 |
+
Lemmas: 91.07%
|
| 9 |
+
UAS: 82.43%
|
| 10 |
+
LAS: 75.75%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.88.conllu
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/dev.88.conllu.eval
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Tokens: 100.00%
|
| 2 |
+
Sentences: 100.00%
|
| 3 |
+
Words: 100.00%
|
| 4 |
+
UPOS: 96.78%
|
| 5 |
+
XPOS: 90.99%
|
| 6 |
+
UFeats: 92.97%
|
| 7 |
+
AllTags: 90.30%
|
| 8 |
+
Lemmas: 91.17%
|
| 9 |
+
UAS: 82.34%
|
| 10 |
+
LAS: 75.69%
|
| 11 |
+
CLAS: 0.00%
|
| 12 |
+
MLAS: 0.00%
|
| 13 |
+
BLEX: 0.00%
|
runs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1/mappings.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08870756edf1bd1ad1bbe09daf9ca77e374a228c2b1e6c3a918671a94109e1b1
|
| 3 |
+
size 291619
|
runs/final_run-seed=1.log
ADDED
|
@@ -0,0 +1,307 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/models/functional.py:225: UserWarning: The structure of `inputs` doesn't match the expected structure: ['keras_tensor', 'keras_tensor_1', 'keras_tensor_2', 'keras_tensor_3', 'keras_tensor_4', 'keras_tensor_5']. Received: the structure of inputs=('*', '*', '*', '*', '*', '*')
|
| 2 |
+
warnings.warn(
|
| 3 |
+
{
|
| 4 |
+
"batch_size": 16,
|
| 5 |
+
"deprel": "full",
|
| 6 |
+
"dev": [
|
| 7 |
+
"la_giuseppe/dev.conllu"
|
| 8 |
+
],
|
| 9 |
+
"dropout": 0.5,
|
| 10 |
+
"embed_tags": [],
|
| 11 |
+
"epochs": 100,
|
| 12 |
+
"epochs_frozen": 20,
|
| 13 |
+
"exp": "all_three_100_epochs",
|
| 14 |
+
"label_smoothing": 0.03,
|
| 15 |
+
"learning_rate": 2e-05,
|
| 16 |
+
"learning_rate_decay": "cos",
|
| 17 |
+
"learning_rate_warmup": 2000,
|
| 18 |
+
"load": [],
|
| 19 |
+
"logdir": "logs/all_three_100_epochs-latinpipe_evalatin24-8211261-250407_204204-s1",
|
| 20 |
+
"max_train_sentence_len": 150,
|
| 21 |
+
"optimizer": "adam",
|
| 22 |
+
"parse": 1,
|
| 23 |
+
"parse_attention_dim": 512,
|
| 24 |
+
"rnn_dim": 512,
|
| 25 |
+
"rnn_layers": 2,
|
| 26 |
+
"rnn_type": "LSTMTorch",
|
| 27 |
+
"save_checkpoint": true,
|
| 28 |
+
"script": "latinpipe_evalatin24.py",
|
| 29 |
+
"seed": 1,
|
| 30 |
+
"single_root": 1,
|
| 31 |
+
"steps_per_epoch": 1000,
|
| 32 |
+
"subword_combination": "first",
|
| 33 |
+
"tags": [
|
| 34 |
+
3,
|
| 35 |
+
2,
|
| 36 |
+
1,
|
| 37 |
+
4
|
| 38 |
+
],
|
| 39 |
+
"task_hidden_layer": 2048,
|
| 40 |
+
"test": [
|
| 41 |
+
"la_giuseppe/test.conllu"
|
| 42 |
+
],
|
| 43 |
+
"threads": 4,
|
| 44 |
+
"train": [
|
| 45 |
+
"la_giuseppe/train.conllu"
|
| 46 |
+
],
|
| 47 |
+
"train_sampling_exponent": 0.5,
|
| 48 |
+
"transformers": [
|
| 49 |
+
"bowphs/LaBerta",
|
| 50 |
+
"bowphs/PhilBerta",
|
| 51 |
+
"FacebookAI/xlm-roberta-large"
|
| 52 |
+
],
|
| 53 |
+
"treebank_ids": false,
|
| 54 |
+
"verbose": 2,
|
| 55 |
+
"wandb": false,
|
| 56 |
+
"word_masking": null
|
| 57 |
+
}
|
| 58 |
+
Trimmed 2 out of 5089 sentences
|
| 59 |
+
Epoch 1/20
|
| 60 |
+
319/319 - 52s - 162ms/step - dense_1_loss: 0.8678 - dense_3_loss: 0.2504 - dense_5_loss: 0.9293 - dense_7_loss: 0.7376 - loss: 4.3685 - parsing_head_loss: 0.6798 - learning_rate: 1.0000e-03 - dev_UPOS: 93.9650 - dev_XPOS: 79.6019 - dev_UFeats: 82.6470 - dev_Lemmas: 73.2459 - dev_UAS: 58.1766 - dev_LAS: 47.1888
|
| 61 |
+
Epoch 2/20
|
| 62 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.5792 - dense_3_loss: 0.1906 - dense_5_loss: 0.6756 - dense_7_loss: 0.5145 - loss: 3.1468 - parsing_head_loss: 0.5140 - learning_rate: 1.0000e-03 - dev_UPOS: 94.7812 - dev_XPOS: 81.7390 - dev_UFeats: 84.5180 - dev_Lemmas: 76.6211 - dev_UAS: 64.9821 - dev_LAS: 54.3520
|
| 63 |
+
Epoch 3/20
|
| 64 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.5299 - dense_3_loss: 0.1807 - dense_5_loss: 0.6104 - dense_7_loss: 0.4751 - loss: 2.8852 - parsing_head_loss: 0.4821 - learning_rate: 1.0000e-03 - dev_UPOS: 95.2307 - dev_XPOS: 83.0047 - dev_UFeats: 85.3802 - dev_Lemmas: 79.6386 - dev_UAS: 68.8710 - dev_LAS: 59.1855
|
| 65 |
+
Epoch 4/20
|
| 66 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4924 - dense_3_loss: 0.1689 - dense_5_loss: 0.5584 - dense_7_loss: 0.4421 - loss: 2.6808 - parsing_head_loss: 0.4515 - learning_rate: 1.0000e-03 - dev_UPOS: 95.5700 - dev_XPOS: 83.1606 - dev_UFeats: 85.9030 - dev_Lemmas: 80.8585 - dev_UAS: 70.6778 - dev_LAS: 60.9282
|
| 67 |
+
Epoch 5/20
|
| 68 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4815 - dense_3_loss: 0.1662 - dense_5_loss: 0.5320 - dense_7_loss: 0.4299 - loss: 2.5825 - parsing_head_loss: 0.4342 - learning_rate: 1.0000e-03 - dev_UPOS: 95.4875 - dev_XPOS: 83.6926 - dev_UFeats: 86.1139 - dev_Lemmas: 81.3904 - dev_UAS: 71.9252 - dev_LAS: 62.8543
|
| 69 |
+
Epoch 6/20
|
| 70 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4669 - dense_3_loss: 0.1643 - dense_5_loss: 0.5157 - dense_7_loss: 0.4176 - loss: 2.5133 - parsing_head_loss: 0.4248 - learning_rate: 1.0000e-03 - dev_UPOS: 95.5517 - dev_XPOS: 83.8485 - dev_UFeats: 86.1506 - dev_Lemmas: 82.3168 - dev_UAS: 73.7962 - dev_LAS: 64.5419
|
| 71 |
+
Epoch 7/20
|
| 72 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4568 - dense_3_loss: 0.1626 - dense_5_loss: 0.5007 - dense_7_loss: 0.4142 - loss: 2.4572 - parsing_head_loss: 0.4159 - learning_rate: 1.0000e-03 - dev_UPOS: 95.4691 - dev_XPOS: 83.9219 - dev_UFeats: 86.2240 - dev_Lemmas: 82.5277 - dev_UAS: 73.0166 - dev_LAS: 64.1200
|
| 73 |
+
Epoch 8/20
|
| 74 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4537 - dense_3_loss: 0.1613 - dense_5_loss: 0.4864 - dense_7_loss: 0.4092 - loss: 2.4180 - parsing_head_loss: 0.4108 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_XPOS: 84.2520 - dev_UFeats: 86.5908 - dev_Lemmas: 82.8763 - dev_UAS: 75.0436 - dev_LAS: 66.0369
|
| 75 |
+
Epoch 9/20
|
| 76 |
+
319/319 - 49s - 152ms/step - dense_1_loss: 0.4450 - dense_3_loss: 0.1581 - dense_5_loss: 0.4746 - dense_7_loss: 0.4028 - loss: 2.3641 - parsing_head_loss: 0.4006 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7718 - dev_XPOS: 83.9769 - dev_UFeats: 86.6275 - dev_Lemmas: 83.3807 - dev_UAS: 74.9060 - dev_LAS: 66.4863
|
| 77 |
+
Epoch 10/20
|
| 78 |
+
319/319 - 48s - 152ms/step - dense_1_loss: 0.4476 - dense_3_loss: 0.1598 - dense_5_loss: 0.4745 - dense_7_loss: 0.4016 - loss: 2.3511 - parsing_head_loss: 0.3944 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7718 - dev_XPOS: 84.6923 - dev_UFeats: 86.5725 - dev_Lemmas: 83.4174 - dev_UAS: 75.3921 - dev_LAS: 66.7798
|
| 79 |
+
Epoch 11/20
|
| 80 |
+
319/319 - 49s - 152ms/step - dense_1_loss: 0.4426 - dense_3_loss: 0.1575 - dense_5_loss: 0.4650 - dense_7_loss: 0.3990 - loss: 2.3272 - parsing_head_loss: 0.3929 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7535 - dev_XPOS: 84.3804 - dev_UFeats: 86.4808 - dev_Lemmas: 83.6284 - dev_UAS: 75.6214 - dev_LAS: 67.3668
|
| 81 |
+
Epoch 12/20
|
| 82 |
+
319/319 - 48s - 152ms/step - dense_1_loss: 0.4343 - dense_3_loss: 0.1535 - dense_5_loss: 0.4519 - dense_7_loss: 0.3918 - loss: 2.2726 - parsing_head_loss: 0.3815 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9186 - dev_XPOS: 84.5455 - dev_UFeats: 86.8293 - dev_Lemmas: 83.8393 - dev_UAS: 76.1809 - dev_LAS: 67.6970
|
| 83 |
+
Epoch 13/20
|
| 84 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4286 - dense_3_loss: 0.1513 - dense_5_loss: 0.4412 - dense_7_loss: 0.3859 - loss: 2.2285 - parsing_head_loss: 0.3742 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9369 - dev_XPOS: 84.5364 - dev_UFeats: 86.4900 - dev_Lemmas: 84.1328 - dev_UAS: 76.3001 - dev_LAS: 67.6878
|
| 85 |
+
Epoch 14/20
|
| 86 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4221 - dense_3_loss: 0.1500 - dense_5_loss: 0.4348 - dense_7_loss: 0.3804 - loss: 2.1906 - parsing_head_loss: 0.3673 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9736 - dev_XPOS: 84.4171 - dev_UFeats: 86.8477 - dev_Lemmas: 84.4355 - dev_UAS: 76.7679 - dev_LAS: 68.5041
|
| 87 |
+
Epoch 15/20
|
| 88 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4217 - dense_3_loss: 0.1507 - dense_5_loss: 0.4300 - dense_7_loss: 0.3797 - loss: 2.1797 - parsing_head_loss: 0.3635 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9002 - dev_XPOS: 84.5914 - dev_UFeats: 86.9669 - dev_Lemmas: 84.4630 - dev_UAS: 76.5111 - dev_LAS: 68.3023
|
| 89 |
+
Epoch 16/20
|
| 90 |
+
319/319 - 49s - 152ms/step - dense_1_loss: 0.4201 - dense_3_loss: 0.1499 - dense_5_loss: 0.4255 - dense_7_loss: 0.3768 - loss: 2.1593 - parsing_head_loss: 0.3597 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_XPOS: 84.3804 - dev_UFeats: 86.7376 - dev_Lemmas: 84.5180 - dev_UAS: 76.4835 - dev_LAS: 68.2289
|
| 91 |
+
Epoch 17/20
|
| 92 |
+
319/319 - 48s - 152ms/step - dense_1_loss: 0.4182 - dense_3_loss: 0.1491 - dense_5_loss: 0.4235 - dense_7_loss: 0.3740 - loss: 2.1431 - parsing_head_loss: 0.3562 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0286 - dev_XPOS: 84.3529 - dev_UFeats: 86.7926 - dev_Lemmas: 84.5180 - dev_UAS: 77.5016 - dev_LAS: 69.3937
|
| 93 |
+
Epoch 18/20
|
| 94 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4205 - dense_3_loss: 0.1486 - dense_5_loss: 0.4218 - dense_7_loss: 0.3745 - loss: 2.1476 - parsing_head_loss: 0.3588 - learning_rate: 1.0000e-03 - dev_UPOS: 96.1203 - dev_XPOS: 84.4997 - dev_UFeats: 87.0403 - dev_Lemmas: 84.7932 - dev_UAS: 77.0338 - dev_LAS: 68.7425
|
| 95 |
+
Epoch 19/20
|
| 96 |
+
319/319 - 49s - 153ms/step - dense_1_loss: 0.4118 - dense_3_loss: 0.1447 - dense_5_loss: 0.4157 - dense_7_loss: 0.3703 - loss: 2.1044 - parsing_head_loss: 0.3493 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9369 - dev_XPOS: 84.4997 - dev_UFeats: 86.8660 - dev_Lemmas: 84.6831 - dev_UAS: 77.0063 - dev_LAS: 68.6141
|
| 97 |
+
Epoch 20/20
|
| 98 |
+
319/319 - 48s - 152ms/step - dense_1_loss: 0.4171 - dense_3_loss: 0.1463 - dense_5_loss: 0.4134 - dense_7_loss: 0.3704 - loss: 2.1090 - parsing_head_loss: 0.3496 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0011 - dev_XPOS: 84.1878 - dev_UFeats: 87.0036 - dev_Lemmas: 84.7840 - dev_UAS: 77.2540 - dev_LAS: 69.2378
|
| 99 |
+
Epoch 21/120
|
| 100 |
+
/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/optimizers/base_optimizer.py:731: UserWarning: Gradients do not exist for variables ['variable_783', 'variable_784'] when minimizing the loss. If using `model.compile()`, did you forget to provide a `loss` argument?
|
| 101 |
+
warnings.warn(
|
| 102 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.3760 - dense_3_loss: 0.1387 - dense_5_loss: 0.3820 - dense_7_loss: 0.3365 - loss: 1.9480 - parsing_head_loss: 0.3283 - learning_rate: 3.1900e-06 - dev_UPOS: 96.2304 - dev_XPOS: 86.2882 - dev_UFeats: 88.7829 - dev_Lemmas: 86.0314 - dev_UAS: 77.8685 - dev_LAS: 70.1917
|
| 103 |
+
Epoch 22/120
|
| 104 |
+
319/319 - 147s - 462ms/step - dense_1_loss: 0.3386 - dense_3_loss: 0.1307 - dense_5_loss: 0.3570 - dense_7_loss: 0.3032 - loss: 1.8115 - parsing_head_loss: 0.3104 - learning_rate: 6.3800e-06 - dev_UPOS: 96.5055 - dev_XPOS: 87.4530 - dev_UFeats: 90.0761 - dev_Lemmas: 87.0036 - dev_UAS: 78.7306 - dev_LAS: 71.0997
|
| 105 |
+
Epoch 23/120
|
| 106 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.3274 - dense_3_loss: 0.1301 - dense_5_loss: 0.3522 - dense_7_loss: 0.2938 - loss: 1.7772 - parsing_head_loss: 0.3070 - learning_rate: 9.5700e-06 - dev_UPOS: 96.5973 - dev_XPOS: 88.0767 - dev_UFeats: 90.5531 - dev_Lemmas: 87.4897 - dev_UAS: 79.1342 - dev_LAS: 71.7509
|
| 107 |
+
Epoch 24/120
|
| 108 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.3160 - dense_3_loss: 0.1275 - dense_5_loss: 0.3407 - dense_7_loss: 0.2817 - loss: 1.7205 - parsing_head_loss: 0.2982 - learning_rate: 1.2760e-05 - dev_UPOS: 96.5973 - dev_XPOS: 88.4802 - dev_UFeats: 90.7732 - dev_Lemmas: 87.9574 - dev_UAS: 79.4185 - dev_LAS: 71.9618
|
| 109 |
+
Epoch 25/120
|
| 110 |
+
319/319 - 146s - 456ms/step - dense_1_loss: 0.3254 - dense_3_loss: 0.1321 - dense_5_loss: 0.3818 - dense_7_loss: 0.2892 - loss: 1.7946 - parsing_head_loss: 0.3047 - learning_rate: 1.5950e-05 - dev_UPOS: 96.4597 - dev_XPOS: 88.3610 - dev_UFeats: 90.7640 - dev_Lemmas: 86.3799 - dev_UAS: 79.8496 - dev_LAS: 72.3654
|
| 111 |
+
Epoch 26/120
|
| 112 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.3142 - dense_3_loss: 0.1290 - dense_5_loss: 0.3826 - dense_7_loss: 0.2786 - loss: 1.7518 - parsing_head_loss: 0.2961 - learning_rate: 1.9140e-05 - dev_UPOS: 96.4413 - dev_XPOS: 88.9663 - dev_UFeats: 91.0759 - dev_Lemmas: 86.8660 - dev_UAS: 79.9138 - dev_LAS: 72.4755
|
| 113 |
+
Epoch 27/120
|
| 114 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2977 - dense_3_loss: 0.1245 - dense_5_loss: 0.3606 - dense_7_loss: 0.2657 - loss: 1.6733 - parsing_head_loss: 0.2850 - learning_rate: 1.9997e-05 - dev_UPOS: 96.6064 - dev_XPOS: 89.0856 - dev_UFeats: 91.1951 - dev_Lemmas: 87.1962 - dev_UAS: 80.0055 - dev_LAS: 72.7231
|
| 115 |
+
Epoch 28/120
|
| 116 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2848 - dense_3_loss: 0.1217 - dense_5_loss: 0.3443 - dense_7_loss: 0.2552 - loss: 1.6123 - parsing_head_loss: 0.2773 - learning_rate: 1.9983e-05 - dev_UPOS: 96.6064 - dev_XPOS: 89.3974 - dev_UFeats: 91.5711 - dev_Lemmas: 87.5172 - dev_UAS: 80.2715 - dev_LAS: 72.9891
|
| 117 |
+
Epoch 29/120
|
| 118 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2752 - dense_3_loss: 0.1179 - dense_5_loss: 0.3319 - dense_7_loss: 0.2470 - loss: 1.5659 - parsing_head_loss: 0.2714 - learning_rate: 1.9958e-05 - dev_UPOS: 96.6340 - dev_XPOS: 89.3699 - dev_UFeats: 91.6262 - dev_Lemmas: 87.7648 - dev_UAS: 80.4366 - dev_LAS: 73.3835
|
| 119 |
+
Epoch 30/120
|
| 120 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.2716 - dense_3_loss: 0.1181 - dense_5_loss: 0.3250 - dense_7_loss: 0.2436 - loss: 1.5461 - parsing_head_loss: 0.2696 - learning_rate: 1.9922e-05 - dev_UPOS: 96.5606 - dev_XPOS: 89.5992 - dev_UFeats: 91.6995 - dev_Lemmas: 87.9208 - dev_UAS: 80.5558 - dev_LAS: 73.4293
|
| 121 |
+
Epoch 31/120
|
| 122 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2623 - dense_3_loss: 0.1152 - dense_5_loss: 0.3152 - dense_7_loss: 0.2353 - loss: 1.4984 - parsing_head_loss: 0.2611 - learning_rate: 1.9875e-05 - dev_UPOS: 96.7073 - dev_XPOS: 89.8652 - dev_UFeats: 91.8371 - dev_Lemmas: 88.1409 - dev_UAS: 80.7026 - dev_LAS: 73.6861
|
| 123 |
+
Epoch 32/120
|
| 124 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2588 - dense_3_loss: 0.1144 - dense_5_loss: 0.3098 - dense_7_loss: 0.2318 - loss: 1.4784 - parsing_head_loss: 0.2584 - learning_rate: 1.9816e-05 - dev_UPOS: 96.6706 - dev_XPOS: 89.7918 - dev_UFeats: 92.0114 - dev_Lemmas: 88.3977 - dev_UAS: 80.9227 - dev_LAS: 73.9521
|
| 125 |
+
Epoch 33/120
|
| 126 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2520 - dense_3_loss: 0.1117 - dense_5_loss: 0.2977 - dense_7_loss: 0.2254 - loss: 1.4380 - parsing_head_loss: 0.2536 - learning_rate: 1.9747e-05 - dev_UPOS: 96.7073 - dev_XPOS: 89.8285 - dev_UFeats: 92.0939 - dev_Lemmas: 88.5995 - dev_UAS: 80.6842 - dev_LAS: 73.6219
|
| 127 |
+
Epoch 34/120
|
| 128 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.2506 - dense_3_loss: 0.1122 - dense_5_loss: 0.2948 - dense_7_loss: 0.2257 - loss: 1.4329 - parsing_head_loss: 0.2533 - learning_rate: 1.9666e-05 - dev_UPOS: 96.5881 - dev_XPOS: 90.1036 - dev_UFeats: 92.1123 - dev_Lemmas: 88.7554 - dev_UAS: 80.7484 - dev_LAS: 73.8054
|
| 129 |
+
Epoch 35/120
|
| 130 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2435 - dense_3_loss: 0.1095 - dense_5_loss: 0.2888 - dense_7_loss: 0.2193 - loss: 1.3952 - parsing_head_loss: 0.2462 - learning_rate: 1.9575e-05 - dev_UPOS: 96.7624 - dev_XPOS: 90.1862 - dev_UFeats: 92.2498 - dev_Lemmas: 89.0030 - dev_UAS: 80.9869 - dev_LAS: 74.2273
|
| 131 |
+
Epoch 36/120
|
| 132 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.2394 - dense_3_loss: 0.1084 - dense_5_loss: 0.2822 - dense_7_loss: 0.2166 - loss: 1.3777 - parsing_head_loss: 0.2450 - learning_rate: 1.9473e-05 - dev_UPOS: 96.7440 - dev_XPOS: 90.0670 - dev_UFeats: 92.2498 - dev_Lemmas: 89.0672 - dev_UAS: 80.7209 - dev_LAS: 73.8329
|
| 133 |
+
Epoch 37/120
|
| 134 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2359 - dense_3_loss: 0.1071 - dense_5_loss: 0.2772 - dense_7_loss: 0.2137 - loss: 1.3535 - parsing_head_loss: 0.2400 - learning_rate: 1.9360e-05 - dev_UPOS: 96.8082 - dev_XPOS: 90.0945 - dev_UFeats: 92.2315 - dev_Lemmas: 89.2415 - dev_UAS: 81.2437 - dev_LAS: 74.3373
|
| 135 |
+
Epoch 38/120
|
| 136 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.2365 - dense_3_loss: 0.1074 - dense_5_loss: 0.2784 - dense_7_loss: 0.2133 - loss: 1.3513 - parsing_head_loss: 0.2367 - learning_rate: 1.9237e-05 - dev_UPOS: 96.7715 - dev_XPOS: 90.2504 - dev_UFeats: 92.3599 - dev_Lemmas: 89.3516 - dev_UAS: 81.1978 - dev_LAS: 74.2823
|
| 137 |
+
Epoch 39/120
|
| 138 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.2303 - dense_3_loss: 0.1060 - dense_5_loss: 0.2684 - dense_7_loss: 0.2087 - loss: 1.3204 - parsing_head_loss: 0.2341 - learning_rate: 1.9103e-05 - dev_UPOS: 96.7257 - dev_XPOS: 90.2871 - dev_UFeats: 92.3599 - dev_Lemmas: 89.3882 - dev_UAS: 81.0969 - dev_LAS: 74.3832
|
| 139 |
+
Epoch 40/120
|
| 140 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.2257 - dense_3_loss: 0.1036 - dense_5_loss: 0.2645 - dense_7_loss: 0.2048 - loss: 1.2952 - parsing_head_loss: 0.2285 - learning_rate: 1.8960e-05 - dev_UPOS: 96.7348 - dev_XPOS: 90.2596 - dev_UFeats: 92.3966 - dev_Lemmas: 89.7459 - dev_UAS: 81.2162 - dev_LAS: 74.3649
|
| 141 |
+
Epoch 41/120
|
| 142 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.2221 - dense_3_loss: 0.1027 - dense_5_loss: 0.2581 - dense_7_loss: 0.2028 - loss: 1.2754 - parsing_head_loss: 0.2251 - learning_rate: 1.8806e-05 - dev_UPOS: 96.7715 - dev_XPOS: 90.2871 - dev_UFeats: 92.5617 - dev_Lemmas: 89.6817 - dev_UAS: 81.3446 - dev_LAS: 74.5116
|
| 143 |
+
Epoch 42/120
|
| 144 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2193 - dense_3_loss: 0.1025 - dense_5_loss: 0.2518 - dense_7_loss: 0.2004 - loss: 1.2575 - parsing_head_loss: 0.2228 - learning_rate: 1.8642e-05 - dev_UPOS: 96.8082 - dev_XPOS: 90.3788 - dev_UFeats: 92.6717 - dev_Lemmas: 89.7643 - dev_UAS: 81.4363 - dev_LAS: 74.5850
|
| 145 |
+
Epoch 43/120
|
| 146 |
+
319/319 - 146s - 456ms/step - dense_1_loss: 0.2209 - dense_3_loss: 0.1032 - dense_5_loss: 0.2548 - dense_7_loss: 0.2016 - loss: 1.2632 - parsing_head_loss: 0.2231 - learning_rate: 1.8469e-05 - dev_UPOS: 96.8357 - dev_XPOS: 90.4338 - dev_UFeats: 92.5709 - dev_Lemmas: 89.8560 - dev_UAS: 81.2620 - dev_LAS: 74.5299
|
| 147 |
+
Epoch 44/120
|
| 148 |
+
319/319 - 147s - 462ms/step - dense_1_loss: 0.2160 - dense_3_loss: 0.1009 - dense_5_loss: 0.2470 - dense_7_loss: 0.1973 - loss: 1.2318 - parsing_head_loss: 0.2167 - learning_rate: 1.8286e-05 - dev_UPOS: 96.8541 - dev_XPOS: 90.4613 - dev_UFeats: 92.5158 - dev_Lemmas: 90.0119 - dev_UAS: 81.6381 - dev_LAS: 74.8968
|
| 149 |
+
Epoch 45/120
|
| 150 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2170 - dense_3_loss: 0.1018 - dense_5_loss: 0.2480 - dense_7_loss: 0.1982 - loss: 1.2357 - parsing_head_loss: 0.2178 - learning_rate: 1.8093e-05 - dev_UPOS: 96.8541 - dev_XPOS: 90.5714 - dev_UFeats: 92.6167 - dev_Lemmas: 90.1036 - dev_UAS: 81.8307 - dev_LAS: 75.0344
|
| 151 |
+
Epoch 46/120
|
| 152 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.2124 - dense_3_loss: 0.1007 - dense_5_loss: 0.2431 - dense_7_loss: 0.1958 - loss: 1.2196 - parsing_head_loss: 0.2156 - learning_rate: 1.7892e-05 - dev_UPOS: 96.7807 - dev_XPOS: 90.5806 - dev_UFeats: 92.5892 - dev_Lemmas: 90.0945 - dev_UAS: 81.8857 - dev_LAS: 74.9702
|
| 153 |
+
Epoch 47/120
|
| 154 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2113 - dense_3_loss: 0.1005 - dense_5_loss: 0.2404 - dense_7_loss: 0.1945 - loss: 1.2107 - parsing_head_loss: 0.2138 - learning_rate: 1.7682e-05 - dev_UPOS: 96.8633 - dev_XPOS: 90.7181 - dev_UFeats: 92.7268 - dev_Lemmas: 90.1862 - dev_UAS: 81.7206 - dev_LAS: 75.0161
|
| 155 |
+
Epoch 48/120
|
| 156 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.2085 - dense_3_loss: 0.0990 - dense_5_loss: 0.2356 - dense_7_loss: 0.1922 - loss: 1.1878 - parsing_head_loss: 0.2086 - learning_rate: 1.7463e-05 - dev_UPOS: 96.8908 - dev_XPOS: 90.6448 - dev_UFeats: 92.6626 - dev_Lemmas: 90.2320 - dev_UAS: 81.9958 - dev_LAS: 75.1078
|
| 157 |
+
Epoch 49/120
|
| 158 |
+
319/319 - 145s - 456ms/step - dense_1_loss: 0.2085 - dense_3_loss: 0.0995 - dense_5_loss: 0.2360 - dense_7_loss: 0.1926 - loss: 1.1882 - parsing_head_loss: 0.2082 - learning_rate: 1.7236e-05 - dev_UPOS: 96.8816 - dev_XPOS: 90.4247 - dev_UFeats: 92.5250 - dev_Lemmas: 90.3696 - dev_UAS: 81.9316 - dev_LAS: 75.1811
|
| 159 |
+
Epoch 50/120
|
| 160 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.2056 - dense_3_loss: 0.0981 - dense_5_loss: 0.2322 - dense_7_loss: 0.1901 - loss: 1.1703 - parsing_head_loss: 0.2048 - learning_rate: 1.7000e-05 - dev_UPOS: 96.8082 - dev_XPOS: 90.6998 - dev_UFeats: 92.6351 - dev_Lemmas: 90.4889 - dev_UAS: 81.8674 - dev_LAS: 75.1078
|
| 161 |
+
Epoch 51/120
|
| 162 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.2037 - dense_3_loss: 0.0975 - dense_5_loss: 0.2299 - dense_7_loss: 0.1888 - loss: 1.1568 - parsing_head_loss: 0.2021 - learning_rate: 1.6757e-05 - dev_UPOS: 96.9091 - dev_XPOS: 90.7548 - dev_UFeats: 92.6351 - dev_Lemmas: 90.4430 - dev_UAS: 81.8490 - dev_LAS: 75.1078
|
| 163 |
+
Epoch 52/120
|
| 164 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.2002 - dense_3_loss: 0.0960 - dense_5_loss: 0.2245 - dense_7_loss: 0.1856 - loss: 1.1381 - parsing_head_loss: 0.1997 - learning_rate: 1.6506e-05 - dev_UPOS: 96.8541 - dev_XPOS: 90.7640 - dev_UFeats: 92.6993 - dev_Lemmas: 90.5164 - dev_UAS: 81.9499 - dev_LAS: 75.1628
|
| 165 |
+
Epoch 53/120
|
| 166 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1975 - dense_3_loss: 0.0954 - dense_5_loss: 0.2218 - dense_7_loss: 0.1832 - loss: 1.1236 - parsing_head_loss: 0.1955 - learning_rate: 1.6248e-05 - dev_UPOS: 96.8357 - dev_XPOS: 90.5897 - dev_UFeats: 92.7359 - dev_Lemmas: 90.6081 - dev_UAS: 81.7206 - dev_LAS: 75.0527
|
| 167 |
+
Epoch 54/120
|
| 168 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.1973 - dense_3_loss: 0.0956 - dense_5_loss: 0.2215 - dense_7_loss: 0.1841 - loss: 1.1213 - parsing_head_loss: 0.1948 - learning_rate: 1.5983e-05 - dev_UPOS: 96.7532 - dev_XPOS: 90.7640 - dev_UFeats: 92.9286 - dev_Lemmas: 90.6448 - dev_UAS: 81.9132 - dev_LAS: 75.1720
|
| 169 |
+
Epoch 55/120
|
| 170 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1994 - dense_3_loss: 0.0969 - dense_5_loss: 0.2234 - dense_7_loss: 0.1855 - loss: 1.1330 - parsing_head_loss: 0.1974 - learning_rate: 1.5711e-05 - dev_UPOS: 96.7715 - dev_XPOS: 90.7732 - dev_UFeats: 92.7543 - dev_Lemmas: 90.5714 - dev_UAS: 82.0050 - dev_LAS: 75.1353
|
| 171 |
+
Epoch 56/120
|
| 172 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1959 - dense_3_loss: 0.0951 - dense_5_loss: 0.2182 - dense_7_loss: 0.1823 - loss: 1.1075 - parsing_head_loss: 0.1916 - learning_rate: 1.5433e-05 - dev_UPOS: 96.8082 - dev_XPOS: 90.7640 - dev_UFeats: 92.7084 - dev_Lemmas: 90.6448 - dev_UAS: 82.1150 - dev_LAS: 75.3921
|
| 173 |
+
Epoch 57/120
|
| 174 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1957 - dense_3_loss: 0.0954 - dense_5_loss: 0.2177 - dense_7_loss: 0.1824 - loss: 1.1073 - parsing_head_loss: 0.1916 - learning_rate: 1.5148e-05 - dev_UPOS: 96.8541 - dev_XPOS: 90.7824 - dev_UFeats: 92.6626 - dev_Lemmas: 90.6264 - dev_UAS: 82.2618 - dev_LAS: 75.4838
|
| 175 |
+
Epoch 58/120
|
| 176 |
+
319/319 - 147s - 462ms/step - dense_1_loss: 0.1916 - dense_3_loss: 0.0936 - dense_5_loss: 0.2133 - dense_7_loss: 0.1790 - loss: 1.0840 - parsing_head_loss: 0.1868 - learning_rate: 1.4858e-05 - dev_UPOS: 96.7715 - dev_XPOS: 90.6081 - dev_UFeats: 92.6075 - dev_Lemmas: 90.7548 - dev_UAS: 82.1150 - dev_LAS: 75.5022
|
| 177 |
+
Epoch 59/120
|
| 178 |
+
319/319 - 148s - 463ms/step - dense_1_loss: 0.1902 - dense_3_loss: 0.0931 - dense_5_loss: 0.2117 - dense_7_loss: 0.1773 - loss: 1.0751 - parsing_head_loss: 0.1845 - learning_rate: 1.4562e-05 - dev_UPOS: 96.7440 - dev_XPOS: 90.8007 - dev_UFeats: 92.5617 - dev_Lemmas: 90.8282 - dev_UAS: 82.1700 - dev_LAS: 75.4380
|
| 179 |
+
Epoch 60/120
|
| 180 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1908 - dense_3_loss: 0.0937 - dense_5_loss: 0.2113 - dense_7_loss: 0.1780 - loss: 1.0754 - parsing_head_loss: 0.1847 - learning_rate: 1.4262e-05 - dev_UPOS: 96.7990 - dev_XPOS: 90.8282 - dev_UFeats: 92.7084 - dev_Lemmas: 90.7915 - dev_UAS: 82.2342 - dev_LAS: 75.5847
|
| 181 |
+
Epoch 61/120
|
| 182 |
+
319/319 - 147s - 459ms/step - dense_1_loss: 0.1934 - dense_3_loss: 0.0949 - dense_5_loss: 0.2138 - dense_7_loss: 0.1805 - loss: 1.0866 - parsing_head_loss: 0.1861 - learning_rate: 1.3956e-05 - dev_UPOS: 96.8266 - dev_XPOS: 90.6539 - dev_UFeats: 92.5433 - dev_Lemmas: 90.7090 - dev_UAS: 82.1609 - dev_LAS: 75.5388
|
| 183 |
+
Epoch 62/120
|
| 184 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1909 - dense_3_loss: 0.0936 - dense_5_loss: 0.2095 - dense_7_loss: 0.1780 - loss: 1.0694 - parsing_head_loss: 0.1823 - learning_rate: 1.3646e-05 - dev_UPOS: 96.7348 - dev_XPOS: 90.7732 - dev_UFeats: 92.5433 - dev_Lemmas: 90.7273 - dev_UAS: 82.1425 - dev_LAS: 75.4838
|
| 185 |
+
Epoch 63/120
|
| 186 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1897 - dense_3_loss: 0.0935 - dense_5_loss: 0.2084 - dense_7_loss: 0.1772 - loss: 1.0655 - parsing_head_loss: 0.1823 - learning_rate: 1.3332e-05 - dev_UPOS: 96.8174 - dev_XPOS: 90.7365 - dev_UFeats: 92.6901 - dev_Lemmas: 90.8374 - dev_UAS: 82.2709 - dev_LAS: 75.6214
|
| 187 |
+
Epoch 64/120
|
| 188 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1884 - dense_3_loss: 0.0930 - dense_5_loss: 0.2073 - dense_7_loss: 0.1765 - loss: 1.0573 - parsing_head_loss: 0.1804 - learning_rate: 1.3014e-05 - dev_UPOS: 96.7532 - dev_XPOS: 90.7181 - dev_UFeats: 92.6901 - dev_Lemmas: 90.8007 - dev_UAS: 82.2893 - dev_LAS: 75.7957
|
| 189 |
+
Epoch 65/120
|
| 190 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1849 - dense_3_loss: 0.0917 - dense_5_loss: 0.2034 - dense_7_loss: 0.1733 - loss: 1.0376 - parsing_head_loss: 0.1761 - learning_rate: 1.2693e-05 - dev_UPOS: 96.7348 - dev_XPOS: 90.8190 - dev_UFeats: 92.6993 - dev_Lemmas: 90.8557 - dev_UAS: 81.9224 - dev_LAS: 75.3462
|
| 191 |
+
Epoch 66/120
|
| 192 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1857 - dense_3_loss: 0.0921 - dense_5_loss: 0.2043 - dense_7_loss: 0.1738 - loss: 1.0389 - parsing_head_loss: 0.1764 - learning_rate: 1.2369e-05 - dev_UPOS: 96.7899 - dev_XPOS: 90.8099 - dev_UFeats: 92.7635 - dev_Lemmas: 90.8099 - dev_UAS: 82.0783 - dev_LAS: 75.5022
|
| 193 |
+
Epoch 67/120
|
| 194 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.1858 - dense_3_loss: 0.0924 - dense_5_loss: 0.2031 - dense_7_loss: 0.1745 - loss: 1.0393 - parsing_head_loss: 0.1758 - learning_rate: 1.2042e-05 - dev_UPOS: 96.6798 - dev_XPOS: 90.8007 - dev_UFeats: 92.7910 - dev_Lemmas: 90.7824 - dev_UAS: 82.1242 - dev_LAS: 75.6489
|
| 195 |
+
Epoch 68/120
|
| 196 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1849 - dense_3_loss: 0.0923 - dense_5_loss: 0.2019 - dense_7_loss: 0.1738 - loss: 1.0337 - parsing_head_loss: 0.1749 - learning_rate: 1.1713e-05 - dev_UPOS: 96.8174 - dev_XPOS: 90.8190 - dev_UFeats: 92.7268 - dev_Lemmas: 90.8466 - dev_UAS: 82.1884 - dev_LAS: 75.4746
|
| 197 |
+
Epoch 69/120
|
| 198 |
+
319/319 - 147s - 459ms/step - dense_1_loss: 0.1825 - dense_3_loss: 0.0911 - dense_5_loss: 0.1997 - dense_7_loss: 0.1711 - loss: 1.0199 - parsing_head_loss: 0.1729 - learning_rate: 1.1381e-05 - dev_UPOS: 96.7807 - dev_XPOS: 90.8466 - dev_UFeats: 92.7451 - dev_Lemmas: 90.8741 - dev_UAS: 82.3260 - dev_LAS: 75.7957
|
| 199 |
+
Epoch 70/120
|
| 200 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1826 - dense_3_loss: 0.0912 - dense_5_loss: 0.1985 - dense_7_loss: 0.1714 - loss: 1.0182 - parsing_head_loss: 0.1715 - learning_rate: 1.1049e-05 - dev_UPOS: 96.7807 - dev_XPOS: 90.8282 - dev_UFeats: 92.6626 - dev_Lemmas: 90.8007 - dev_UAS: 82.4360 - dev_LAS: 75.8048
|
| 201 |
+
Epoch 71/120
|
| 202 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1829 - dense_3_loss: 0.0916 - dense_5_loss: 0.1989 - dense_7_loss: 0.1714 - loss: 1.0170 - parsing_head_loss: 0.1714 - learning_rate: 1.0715e-05 - dev_UPOS: 96.7807 - dev_XPOS: 90.9291 - dev_UFeats: 92.7268 - dev_Lemmas: 90.8557 - dev_UAS: 82.3076 - dev_LAS: 75.7865
|
| 203 |
+
Epoch 72/120
|
| 204 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1811 - dense_3_loss: 0.0910 - dense_5_loss: 0.1969 - dense_7_loss: 0.1707 - loss: 1.0095 - parsing_head_loss: 0.1699 - learning_rate: 1.0380e-05 - dev_UPOS: 96.8082 - dev_XPOS: 90.8832 - dev_UFeats: 92.7359 - dev_Lemmas: 90.8924 - dev_UAS: 82.2709 - dev_LAS: 75.7865
|
| 205 |
+
Epoch 73/120
|
| 206 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1834 - dense_3_loss: 0.0921 - dense_5_loss: 0.1984 - dense_7_loss: 0.1725 - loss: 1.0190 - parsing_head_loss: 0.1709 - learning_rate: 1.0045e-05 - dev_UPOS: 96.7807 - dev_XPOS: 90.8374 - dev_UFeats: 92.8185 - dev_Lemmas: 90.9383 - dev_UAS: 82.0600 - dev_LAS: 75.4471
|
| 207 |
+
Epoch 74/120
|
| 208 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1797 - dense_3_loss: 0.0904 - dense_5_loss: 0.1953 - dense_7_loss: 0.1693 - loss: 0.9992 - parsing_head_loss: 0.1677 - learning_rate: 9.7100e-06 - dev_UPOS: 96.7440 - dev_XPOS: 90.8557 - dev_UFeats: 92.7543 - dev_Lemmas: 91.0117 - dev_UAS: 82.3076 - dev_LAS: 75.6948
|
| 209 |
+
Epoch 75/120
|
| 210 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1803 - dense_3_loss: 0.0911 - dense_5_loss: 0.1954 - dense_7_loss: 0.1700 - loss: 1.0017 - parsing_head_loss: 0.1683 - learning_rate: 9.3752e-06 - dev_UPOS: 96.7624 - dev_XPOS: 90.8649 - dev_UFeats: 92.7451 - dev_Lemmas: 91.0208 - dev_UAS: 82.3718 - dev_LAS: 75.7773
|
| 211 |
+
Epoch 76/120
|
| 212 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1795 - dense_3_loss: 0.0904 - dense_5_loss: 0.1947 - dense_7_loss: 0.1691 - loss: 0.9972 - parsing_head_loss: 0.1675 - learning_rate: 9.0411e-06 - dev_UPOS: 96.7440 - dev_XPOS: 90.9291 - dev_UFeats: 92.7818 - dev_Lemmas: 90.9291 - dev_UAS: 82.1700 - dev_LAS: 75.5388
|
| 213 |
+
Epoch 77/120
|
| 214 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1816 - dense_3_loss: 0.0918 - dense_5_loss: 0.1970 - dense_7_loss: 0.1713 - loss: 1.0070 - parsing_head_loss: 0.1687 - learning_rate: 8.7081e-06 - dev_UPOS: 96.7257 - dev_XPOS: 90.9383 - dev_UFeats: 92.8185 - dev_Lemmas: 90.9658 - dev_UAS: 82.1884 - dev_LAS: 75.5572
|
| 215 |
+
Epoch 78/120
|
| 216 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1775 - dense_3_loss: 0.0896 - dense_5_loss: 0.1916 - dense_7_loss: 0.1672 - loss: 0.9818 - parsing_head_loss: 0.1633 - learning_rate: 8.3765e-06 - dev_UPOS: 96.7624 - dev_XPOS: 90.9199 - dev_UFeats: 92.8735 - dev_Lemmas: 90.9383 - dev_UAS: 82.4360 - dev_LAS: 75.7131
|
| 217 |
+
Epoch 79/120
|
| 218 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1804 - dense_3_loss: 0.0912 - dense_5_loss: 0.1949 - dense_7_loss: 0.1700 - loss: 0.9980 - parsing_head_loss: 0.1673 - learning_rate: 8.0468e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.8924 - dev_UFeats: 92.8827 - dev_Lemmas: 91.0025 - dev_UAS: 82.3902 - dev_LAS: 75.5847
|
| 219 |
+
Epoch 80/120
|
| 220 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1773 - dense_3_loss: 0.0898 - dense_5_loss: 0.1912 - dense_7_loss: 0.1673 - loss: 0.9786 - parsing_head_loss: 0.1623 - learning_rate: 7.7192e-06 - dev_UPOS: 96.7165 - dev_XPOS: 91.0667 - dev_UFeats: 92.8368 - dev_Lemmas: 91.0575 - dev_UAS: 82.4085 - dev_LAS: 75.7131
|
| 221 |
+
Epoch 81/120
|
| 222 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1789 - dense_3_loss: 0.0906 - dense_5_loss: 0.1932 - dense_7_loss: 0.1688 - loss: 0.9884 - parsing_head_loss: 0.1647 - learning_rate: 7.3942e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.8466 - dev_UFeats: 92.8735 - dev_Lemmas: 90.9658 - dev_UAS: 82.4911 - dev_LAS: 75.7315
|
| 223 |
+
Epoch 82/120
|
| 224 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1742 - dense_3_loss: 0.0885 - dense_5_loss: 0.1881 - dense_7_loss: 0.1644 - loss: 0.9638 - parsing_head_loss: 0.1606 - learning_rate: 7.0722e-06 - dev_UPOS: 96.7807 - dev_XPOS: 90.8741 - dev_UFeats: 92.8460 - dev_Lemmas: 91.0759 - dev_UAS: 82.3443 - dev_LAS: 75.6948
|
| 225 |
+
Epoch 83/120
|
| 226 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1755 - dense_3_loss: 0.0893 - dense_5_loss: 0.1897 - dense_7_loss: 0.1656 - loss: 0.9704 - parsing_head_loss: 0.1615 - learning_rate: 6.7534e-06 - dev_UPOS: 96.7165 - dev_XPOS: 90.9108 - dev_UFeats: 92.8919 - dev_Lemmas: 91.0575 - dev_UAS: 82.4544 - dev_LAS: 75.7498
|
| 227 |
+
Epoch 84/120
|
| 228 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1784 - dense_3_loss: 0.0909 - dense_5_loss: 0.1921 - dense_7_loss: 0.1686 - loss: 0.9852 - parsing_head_loss: 0.1644 - learning_rate: 6.4382e-06 - dev_UPOS: 96.6706 - dev_XPOS: 90.9841 - dev_UFeats: 92.8643 - dev_Lemmas: 91.0025 - dev_UAS: 82.4819 - dev_LAS: 75.6948
|
| 229 |
+
Epoch 85/120
|
| 230 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1782 - dense_3_loss: 0.0908 - dense_5_loss: 0.1910 - dense_7_loss: 0.1681 - loss: 0.9804 - parsing_head_loss: 0.1629 - learning_rate: 6.1271e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.9750 - dev_UFeats: 92.8277 - dev_Lemmas: 91.0208 - dev_UAS: 82.3535 - dev_LAS: 75.6306
|
| 231 |
+
Epoch 86/120
|
| 232 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1736 - dense_3_loss: 0.0885 - dense_5_loss: 0.1864 - dense_7_loss: 0.1641 - loss: 0.9561 - parsing_head_loss: 0.1589 - learning_rate: 5.8203e-06 - dev_UPOS: 96.7807 - dev_XPOS: 90.9841 - dev_UFeats: 92.8185 - dev_Lemmas: 91.0759 - dev_UAS: 82.4544 - dev_LAS: 75.7406
|
| 233 |
+
Epoch 87/120
|
| 234 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1779 - dense_3_loss: 0.0907 - dense_5_loss: 0.1908 - dense_7_loss: 0.1682 - loss: 0.9789 - parsing_head_loss: 0.1628 - learning_rate: 5.5182e-06 - dev_UPOS: 96.7348 - dev_XPOS: 91.0300 - dev_UFeats: 92.8919 - dev_Lemmas: 91.0667 - dev_UAS: 82.4269 - dev_LAS: 75.7498
|
| 235 |
+
Epoch 88/120
|
| 236 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1744 - dense_3_loss: 0.0890 - dense_5_loss: 0.1868 - dense_7_loss: 0.1646 - loss: 0.9592 - parsing_head_loss: 0.1594 - learning_rate: 5.2212e-06 - dev_UPOS: 96.7807 - dev_XPOS: 90.9933 - dev_UFeats: 92.9652 - dev_Lemmas: 91.1676 - dev_UAS: 82.3351 - dev_LAS: 75.6948
|
| 237 |
+
Epoch 89/120
|
| 238 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1738 - dense_3_loss: 0.0886 - dense_5_loss: 0.1858 - dense_7_loss: 0.1642 - loss: 0.9532 - parsing_head_loss: 0.1581 - learning_rate: 4.9295e-06 - dev_UPOS: 96.7899 - dev_XPOS: 91.0117 - dev_UFeats: 92.8735 - dev_Lemmas: 91.1492 - dev_UAS: 82.5461 - dev_LAS: 75.8782
|
| 239 |
+
Epoch 90/120
|
| 240 |
+
319/319 - 145s - 455ms/step - dense_1_loss: 0.1784 - dense_3_loss: 0.0914 - dense_5_loss: 0.1921 - dense_7_loss: 0.1689 - loss: 0.9820 - parsing_head_loss: 0.1629 - learning_rate: 4.6435e-06 - dev_UPOS: 96.8082 - dev_XPOS: 90.8741 - dev_UFeats: 92.8001 - dev_Lemmas: 91.1125 - dev_UAS: 82.4635 - dev_LAS: 75.8323
|
| 241 |
+
Epoch 91/120
|
| 242 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1737 - dense_3_loss: 0.0888 - dense_5_loss: 0.1862 - dense_7_loss: 0.1639 - loss: 0.9538 - parsing_head_loss: 0.1580 - learning_rate: 4.3635e-06 - dev_UPOS: 96.7624 - dev_XPOS: 90.8741 - dev_UFeats: 92.7268 - dev_Lemmas: 91.1034 - dev_UAS: 82.3076 - dev_LAS: 75.7406
|
| 243 |
+
Epoch 92/120
|
| 244 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1759 - dense_3_loss: 0.0900 - dense_5_loss: 0.1881 - dense_7_loss: 0.1660 - loss: 0.9631 - parsing_head_loss: 0.1592 - learning_rate: 4.0899e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.8649 - dev_UFeats: 92.8460 - dev_Lemmas: 91.1034 - dev_UAS: 82.3168 - dev_LAS: 75.7131
|
| 245 |
+
Epoch 93/120
|
| 246 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1728 - dense_3_loss: 0.0887 - dense_5_loss: 0.1845 - dense_7_loss: 0.1634 - loss: 0.9481 - parsing_head_loss: 0.1569 - learning_rate: 3.8229e-06 - dev_UPOS: 96.7807 - dev_XPOS: 90.9108 - dev_UFeats: 92.8552 - dev_Lemmas: 91.0942 - dev_UAS: 82.3260 - dev_LAS: 75.7681
|
| 247 |
+
Epoch 94/120
|
| 248 |
+
319/319 - 147s - 459ms/step - dense_1_loss: 0.1742 - dense_3_loss: 0.0893 - dense_5_loss: 0.1869 - dense_7_loss: 0.1650 - loss: 0.9565 - parsing_head_loss: 0.1584 - learning_rate: 3.5628e-06 - dev_UPOS: 96.7990 - dev_XPOS: 90.9016 - dev_UFeats: 92.8643 - dev_Lemmas: 91.1217 - dev_UAS: 82.4085 - dev_LAS: 75.7957
|
| 249 |
+
Epoch 95/120
|
| 250 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.1744 - dense_3_loss: 0.0895 - dense_5_loss: 0.1867 - dense_7_loss: 0.1652 - loss: 0.9577 - parsing_head_loss: 0.1587 - learning_rate: 3.3100e-06 - dev_UPOS: 96.7624 - dev_XPOS: 90.9291 - dev_UFeats: 92.9102 - dev_Lemmas: 91.1492 - dev_UAS: 82.4177 - dev_LAS: 75.8048
|
| 251 |
+
Epoch 96/120
|
| 252 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1748 - dense_3_loss: 0.0896 - dense_5_loss: 0.1872 - dense_7_loss: 0.1655 - loss: 0.9582 - parsing_head_loss: 0.1588 - learning_rate: 3.0647e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.9933 - dev_UFeats: 92.9286 - dev_Lemmas: 91.1492 - dev_UAS: 82.4544 - dev_LAS: 75.8323
|
| 253 |
+
Epoch 97/120
|
| 254 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1731 - dense_3_loss: 0.0889 - dense_5_loss: 0.1852 - dense_7_loss: 0.1637 - loss: 0.9508 - parsing_head_loss: 0.1575 - learning_rate: 2.8272e-06 - dev_UPOS: 96.7532 - dev_XPOS: 90.9750 - dev_UFeats: 92.9286 - dev_Lemmas: 91.1676 - dev_UAS: 82.4177 - dev_LAS: 75.8140
|
| 255 |
+
Epoch 98/120
|
| 256 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1754 - dense_3_loss: 0.0901 - dense_5_loss: 0.1873 - dense_7_loss: 0.1659 - loss: 0.9622 - parsing_head_loss: 0.1589 - learning_rate: 2.5977e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.9566 - dev_UFeats: 92.9102 - dev_Lemmas: 91.1859 - dev_UAS: 82.3718 - dev_LAS: 75.7957
|
| 257 |
+
Epoch 99/120
|
| 258 |
+
319/319 - 147s - 459ms/step - dense_1_loss: 0.1726 - dense_3_loss: 0.0886 - dense_5_loss: 0.1846 - dense_7_loss: 0.1636 - loss: 0.9465 - parsing_head_loss: 0.1567 - learning_rate: 2.3765e-06 - dev_UPOS: 96.8174 - dev_XPOS: 90.9658 - dev_UFeats: 92.8919 - dev_Lemmas: 91.1676 - dev_UAS: 82.4819 - dev_LAS: 76.0066
|
| 259 |
+
Epoch 100/120
|
| 260 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.1736 - dense_3_loss: 0.0895 - dense_5_loss: 0.1860 - dense_7_loss: 0.1646 - loss: 0.9531 - parsing_head_loss: 0.1579 - learning_rate: 2.1639e-06 - dev_UPOS: 96.8174 - dev_XPOS: 90.8741 - dev_UFeats: 92.9102 - dev_Lemmas: 91.2043 - dev_UAS: 82.6011 - dev_LAS: 76.0066
|
| 261 |
+
Epoch 101/120
|
| 262 |
+
319/319 - 146s - 457ms/step - dense_1_loss: 0.1748 - dense_3_loss: 0.0900 - dense_5_loss: 0.1867 - dense_7_loss: 0.1652 - loss: 0.9568 - parsing_head_loss: 0.1583 - learning_rate: 1.9601e-06 - dev_UPOS: 96.7715 - dev_XPOS: 90.9291 - dev_UFeats: 92.8552 - dev_Lemmas: 91.1492 - dev_UAS: 82.4544 - dev_LAS: 75.8874
|
| 263 |
+
Epoch 102/120
|
| 264 |
+
319/319 - 146s - 459ms/step - dense_1_loss: 0.1738 - dense_3_loss: 0.0894 - dense_5_loss: 0.1853 - dense_7_loss: 0.1647 - loss: 0.9510 - parsing_head_loss: 0.1576 - learning_rate: 1.7654e-06 - dev_UPOS: 96.7807 - dev_XPOS: 90.9108 - dev_UFeats: 92.8643 - dev_Lemmas: 91.1401 - dev_UAS: 82.4452 - dev_LAS: 75.8874
|
| 265 |
+
Epoch 103/120
|
| 266 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1741 - dense_3_loss: 0.0896 - dense_5_loss: 0.1860 - dense_7_loss: 0.1649 - loss: 0.9535 - parsing_head_loss: 0.1579 - learning_rate: 1.5799e-06 - dev_UPOS: 96.7532 - dev_XPOS: 90.9291 - dev_UFeats: 92.8735 - dev_Lemmas: 91.1401 - dev_UAS: 82.3810 - dev_LAS: 75.8232
|
| 267 |
+
Epoch 104/120
|
| 268 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1730 - dense_3_loss: 0.0890 - dense_5_loss: 0.1849 - dense_7_loss: 0.1639 - loss: 0.9468 - parsing_head_loss: 0.1566 - learning_rate: 1.4038e-06 - dev_UPOS: 96.7532 - dev_XPOS: 90.9933 - dev_UFeats: 92.8643 - dev_Lemmas: 91.1401 - dev_UAS: 82.5094 - dev_LAS: 75.9883
|
| 269 |
+
Epoch 105/120
|
| 270 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1714 - dense_3_loss: 0.0883 - dense_5_loss: 0.1831 - dense_7_loss: 0.1624 - loss: 0.9393 - parsing_head_loss: 0.1552 - learning_rate: 1.2374e-06 - dev_UPOS: 96.7624 - dev_XPOS: 90.9566 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1859 - dev_UAS: 82.4911 - dev_LAS: 75.9791
|
| 271 |
+
Epoch 106/120
|
| 272 |
+
319/319 - 150s - 469ms/step - dense_1_loss: 0.1712 - dense_3_loss: 0.0882 - dense_5_loss: 0.1829 - dense_7_loss: 0.1620 - loss: 0.9370 - parsing_head_loss: 0.1551 - learning_rate: 1.0809e-06 - dev_UPOS: 96.7257 - dev_XPOS: 90.9016 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1767 - dev_UAS: 82.4727 - dev_LAS: 75.9516
|
| 273 |
+
Epoch 107/120
|
| 274 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1725 - dense_3_loss: 0.0887 - dense_5_loss: 0.1838 - dense_7_loss: 0.1629 - loss: 0.9424 - parsing_head_loss: 0.1563 - learning_rate: 9.3436e-07 - dev_UPOS: 96.7348 - dev_XPOS: 90.8924 - dev_UFeats: 92.8643 - dev_Lemmas: 91.1676 - dev_UAS: 82.4360 - dev_LAS: 75.8965
|
| 275 |
+
Epoch 108/120
|
| 276 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1708 - dense_3_loss: 0.0880 - dense_5_loss: 0.1826 - dense_7_loss: 0.1620 - loss: 0.9361 - parsing_head_loss: 0.1549 - learning_rate: 7.9801e-07 - dev_UPOS: 96.7348 - dev_XPOS: 90.9199 - dev_UFeats: 92.8643 - dev_Lemmas: 91.1859 - dev_UAS: 82.5094 - dev_LAS: 75.9974
|
| 277 |
+
Epoch 109/120
|
| 278 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1714 - dense_3_loss: 0.0884 - dense_5_loss: 0.1835 - dense_7_loss: 0.1624 - loss: 0.9383 - parsing_head_loss: 0.1554 - learning_rate: 6.7200e-07 - dev_UPOS: 96.7807 - dev_XPOS: 90.8741 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1951 - dev_UAS: 82.5369 - dev_LAS: 75.9791
|
| 279 |
+
Epoch 110/120
|
| 280 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1712 - dense_3_loss: 0.0881 - dense_5_loss: 0.1828 - dense_7_loss: 0.1619 - loss: 0.9359 - parsing_head_loss: 0.1549 - learning_rate: 5.5647e-07 - dev_UPOS: 96.7624 - dev_XPOS: 90.9566 - dev_UFeats: 92.9102 - dev_Lemmas: 91.1676 - dev_UAS: 82.5644 - dev_LAS: 76.0708
|
| 281 |
+
Epoch 111/120
|
| 282 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1715 - dense_3_loss: 0.0884 - dense_5_loss: 0.1837 - dense_7_loss: 0.1626 - loss: 0.9384 - parsing_head_loss: 0.1548 - learning_rate: 4.5154e-07 - dev_UPOS: 96.7624 - dev_XPOS: 90.9841 - dev_UFeats: 92.8919 - dev_Lemmas: 91.1309 - dev_UAS: 82.5644 - dev_LAS: 76.1075
|
| 283 |
+
Epoch 112/120
|
| 284 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1720 - dense_3_loss: 0.0886 - dense_5_loss: 0.1837 - dense_7_loss: 0.1627 - loss: 0.9398 - parsing_head_loss: 0.1546 - learning_rate: 3.5734e-07 - dev_UPOS: 96.7899 - dev_XPOS: 91.0208 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1584 - dev_UAS: 82.4544 - dev_LAS: 75.9699
|
| 285 |
+
Epoch 113/120
|
| 286 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1717 - dense_3_loss: 0.0884 - dense_5_loss: 0.1835 - dense_7_loss: 0.1625 - loss: 0.9397 - parsing_head_loss: 0.1554 - learning_rate: 2.7398e-07 - dev_UPOS: 96.7807 - dev_XPOS: 90.9933 - dev_UFeats: 92.9194 - dev_Lemmas: 91.1676 - dev_UAS: 82.5186 - dev_LAS: 76.0433
|
| 287 |
+
Epoch 114/120
|
| 288 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1724 - dense_3_loss: 0.0888 - dense_5_loss: 0.1845 - dense_7_loss: 0.1633 - loss: 0.9423 - parsing_head_loss: 0.1549 - learning_rate: 2.0153e-07 - dev_UPOS: 96.7807 - dev_XPOS: 90.9933 - dev_UFeats: 92.9194 - dev_Lemmas: 91.1676 - dev_UAS: 82.4911 - dev_LAS: 76.0249
|
| 289 |
+
Epoch 115/120
|
| 290 |
+
319/319 - 147s - 462ms/step - dense_1_loss: 0.1707 - dense_3_loss: 0.0879 - dense_5_loss: 0.1818 - dense_7_loss: 0.1617 - loss: 0.9331 - parsing_head_loss: 0.1541 - learning_rate: 1.4010e-07 - dev_UPOS: 96.7807 - dev_XPOS: 91.0025 - dev_UFeats: 92.8919 - dev_Lemmas: 91.1676 - dev_UAS: 82.4819 - dev_LAS: 75.9791
|
| 291 |
+
Epoch 116/120
|
| 292 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1707 - dense_3_loss: 0.0880 - dense_5_loss: 0.1817 - dense_7_loss: 0.1616 - loss: 0.9327 - parsing_head_loss: 0.1540 - learning_rate: 8.9738e-08 - dev_UPOS: 96.7807 - dev_XPOS: 90.9658 - dev_UFeats: 92.9102 - dev_Lemmas: 91.1584 - dev_UAS: 82.4819 - dev_LAS: 75.9791
|
| 293 |
+
Epoch 117/120
|
| 294 |
+
319/319 - 146s - 458ms/step - dense_1_loss: 0.1725 - dense_3_loss: 0.0890 - dense_5_loss: 0.1838 - dense_7_loss: 0.1637 - loss: 0.9431 - parsing_head_loss: 0.1555 - learning_rate: 5.0511e-08 - dev_UPOS: 96.7807 - dev_XPOS: 90.9750 - dev_UFeats: 92.8919 - dev_Lemmas: 91.1676 - dev_UAS: 82.4819 - dev_LAS: 75.9974
|
| 295 |
+
Epoch 118/120
|
| 296 |
+
319/319 - 147s - 461ms/step - dense_1_loss: 0.1705 - dense_3_loss: 0.0880 - dense_5_loss: 0.1821 - dense_7_loss: 0.1615 - loss: 0.9339 - parsing_head_loss: 0.1543 - learning_rate: 2.2460e-08 - dev_UPOS: 96.7715 - dev_XPOS: 90.9750 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1492 - dev_UAS: 82.4911 - dev_LAS: 76.0158
|
| 297 |
+
Epoch 119/120
|
| 298 |
+
319/319 - 147s - 460ms/step - dense_1_loss: 0.1725 - dense_3_loss: 0.0888 - dense_5_loss: 0.1838 - dense_7_loss: 0.1633 - loss: 0.9425 - parsing_head_loss: 0.1555 - learning_rate: 5.6165e-09 - dev_UPOS: 96.7807 - dev_XPOS: 90.9750 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1492 - dev_UAS: 82.4911 - dev_LAS: 76.0066
|
| 299 |
+
Epoch 120/120
|
| 300 |
+
319/319 - 151s - 473ms/step - dense_1_loss: 0.1724 - dense_3_loss: 0.0888 - dense_5_loss: 0.1834 - dense_7_loss: 0.1632 - loss: 0.9398 - parsing_head_loss: 0.1548 - learning_rate: 0.0000e+00 - dev_UPOS: 96.7807 - dev_XPOS: 90.9750 - dev_UFeats: 92.9010 - dev_Lemmas: 91.1492 - dev_UAS: 82.4911 - dev_LAS: 76.0066 - test_UPOS: 97.0846 - test_XPOS: 91.7291 - test_UFeats: 93.3924 - test_Lemmas: 90.6050 - test_UAS: 83.6227 - test_LAS: 77.2071
|
| 301 |
+
Traceback (most recent call last):
|
| 302 |
+
File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 935, in <module>
|
| 303 |
+
main([] if "__file__" not in globals() else None)
|
| 304 |
+
File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 819, in main
|
| 305 |
+
with open(os.path.join(os.path.dirname(args.load[0]), "options.json"), mode="r") as options_file:
|
| 306 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 307 |
+
FileNotFoundError: [Errno 2] No such file or directory: '/home/hd/hd_hd/hd_ec199/evalatin2024-latinpipe/latinpipe-evalatin/options.json'
|
runs/final_run.log
ADDED
|
@@ -0,0 +1,306 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/models/functional.py:225: UserWarning: The structure of `inputs` doesn't match the expected structure: ['keras_tensor', 'keras_tensor_1', 'keras_tensor_2', 'keras_tensor_3', 'keras_tensor_4', 'keras_tensor_5']. Received: the structure of inputs=('*', '*', '*', '*', '*', '*')
|
| 2 |
+
warnings.warn(
|
| 3 |
+
{
|
| 4 |
+
"batch_size": 16,
|
| 5 |
+
"deprel": "full",
|
| 6 |
+
"dev": [
|
| 7 |
+
"la_giuseppe/dev.conllu"
|
| 8 |
+
],
|
| 9 |
+
"dropout": 0.5,
|
| 10 |
+
"embed_tags": [],
|
| 11 |
+
"epochs": 100,
|
| 12 |
+
"epochs_frozen": 20,
|
| 13 |
+
"exp": "all_three_100_epochs",
|
| 14 |
+
"label_smoothing": 0.03,
|
| 15 |
+
"learning_rate": 2e-05,
|
| 16 |
+
"learning_rate_decay": "cos",
|
| 17 |
+
"learning_rate_warmup": 2000,
|
| 18 |
+
"load": [],
|
| 19 |
+
"logdir": "logs/all_three_100_epochs-latinpipe_evalatin24-8201717-250407_140047-s2",
|
| 20 |
+
"max_train_sentence_len": 150,
|
| 21 |
+
"optimizer": "adam",
|
| 22 |
+
"parse": 1,
|
| 23 |
+
"parse_attention_dim": 512,
|
| 24 |
+
"rnn_dim": 512,
|
| 25 |
+
"rnn_layers": 2,
|
| 26 |
+
"rnn_type": "LSTMTorch",
|
| 27 |
+
"save_checkpoint": true,
|
| 28 |
+
"script": "latinpipe_evalatin24.py",
|
| 29 |
+
"seed": 2,
|
| 30 |
+
"single_root": 1,
|
| 31 |
+
"steps_per_epoch": 1000,
|
| 32 |
+
"subword_combination": "first",
|
| 33 |
+
"tags": [
|
| 34 |
+
2,
|
| 35 |
+
1,
|
| 36 |
+
4
|
| 37 |
+
],
|
| 38 |
+
"task_hidden_layer": 2048,
|
| 39 |
+
"test": [
|
| 40 |
+
"la_giuseppe/test.conllu"
|
| 41 |
+
],
|
| 42 |
+
"threads": 4,
|
| 43 |
+
"train": [
|
| 44 |
+
"la_giuseppe/train.conllu"
|
| 45 |
+
],
|
| 46 |
+
"train_sampling_exponent": 0.5,
|
| 47 |
+
"transformers": [
|
| 48 |
+
"bowphs/LaBerta",
|
| 49 |
+
"bowphs/PhilBerta",
|
| 50 |
+
"FacebookAI/xlm-roberta-large"
|
| 51 |
+
],
|
| 52 |
+
"treebank_ids": false,
|
| 53 |
+
"verbose": 2,
|
| 54 |
+
"wandb": false,
|
| 55 |
+
"word_masking": null
|
| 56 |
+
}
|
| 57 |
+
Trimmed 2 out of 5089 sentences
|
| 58 |
+
Epoch 1/20
|
| 59 |
+
319/319 - 50s - 158ms/step - dense_1_loss: 0.2477 - dense_3_loss: 0.9185 - dense_5_loss: 0.7275 - loss: 3.4780 - parsing_head_loss: 0.6817 - learning_rate: 1.0000e-03 - dev_UPOS: 93.9191 - dev_UFeats: 82.3443 - dev_Lemmas: 73.4568 - dev_UAS: 60.3320 - dev_LAS: 49.1975
|
| 60 |
+
Epoch 2/20
|
| 61 |
+
319/319 - 47s - 147ms/step - dense_1_loss: 0.1904 - dense_3_loss: 0.6759 - dense_5_loss: 0.5141 - loss: 2.5663 - parsing_head_loss: 0.5140 - learning_rate: 1.0000e-03 - dev_UPOS: 94.6804 - dev_UFeats: 83.8577 - dev_Lemmas: 77.2998 - dev_UAS: 66.0552 - dev_LAS: 56.0304
|
| 62 |
+
Epoch 3/20
|
| 63 |
+
319/319 - 47s - 147ms/step - dense_1_loss: 0.1783 - dense_3_loss: 0.6080 - dense_5_loss: 0.4744 - loss: 2.3521 - parsing_head_loss: 0.4798 - learning_rate: 1.0000e-03 - dev_UPOS: 95.2674 - dev_UFeats: 85.1876 - dev_Lemmas: 79.2993 - dev_UAS: 69.1920 - dev_LAS: 59.4607
|
| 64 |
+
Epoch 4/20
|
| 65 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1717 - dense_3_loss: 0.5644 - dense_5_loss: 0.4464 - loss: 2.2021 - parsing_head_loss: 0.4540 - learning_rate: 1.0000e-03 - dev_UPOS: 95.0197 - dev_UFeats: 85.6370 - dev_Lemmas: 80.7209 - dev_UAS: 70.3476 - dev_LAS: 61.0382
|
| 66 |
+
Epoch 5/20
|
| 67 |
+
319/319 - 47s - 149ms/step - dense_1_loss: 0.1690 - dense_3_loss: 0.5288 - dense_5_loss: 0.4247 - loss: 2.0944 - parsing_head_loss: 0.4340 - learning_rate: 1.0000e-03 - dev_UPOS: 94.8088 - dev_UFeats: 86.0772 - dev_Lemmas: 81.4455 - dev_UAS: 71.7784 - dev_LAS: 62.4415
|
| 68 |
+
Epoch 6/20
|
| 69 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1705 - dense_3_loss: 0.5209 - dense_5_loss: 0.4314 - loss: 2.0831 - parsing_head_loss: 0.4325 - learning_rate: 1.0000e-03 - dev_UPOS: 95.4600 - dev_UFeats: 85.8571 - dev_Lemmas: 81.7940 - dev_UAS: 73.0808 - dev_LAS: 64.3034
|
| 70 |
+
Epoch 7/20
|
| 71 |
+
319/319 - 47s - 147ms/step - dense_1_loss: 0.1616 - dense_3_loss: 0.4974 - dense_5_loss: 0.4151 - loss: 1.9977 - parsing_head_loss: 0.4142 - learning_rate: 1.0000e-03 - dev_UPOS: 95.5242 - dev_UFeats: 86.4533 - dev_Lemmas: 82.2801 - dev_UAS: 74.3282 - dev_LAS: 65.0738
|
| 72 |
+
Epoch 8/20
|
| 73 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1619 - dense_3_loss: 0.4869 - dense_5_loss: 0.4090 - loss: 1.9691 - parsing_head_loss: 0.4101 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_UFeats: 86.4074 - dev_Lemmas: 82.7020 - dev_UAS: 74.1631 - dev_LAS: 65.8993
|
| 74 |
+
Epoch 9/20
|
| 75 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1561 - dense_3_loss: 0.4713 - dense_5_loss: 0.3972 - loss: 1.8996 - parsing_head_loss: 0.3948 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6709 - dev_UFeats: 86.2973 - dev_Lemmas: 83.0872 - dev_UAS: 75.0344 - dev_LAS: 66.3487
|
| 76 |
+
Epoch 10/20
|
| 77 |
+
319/319 - 47s - 146ms/step - dense_1_loss: 0.1590 - dense_3_loss: 0.4727 - dense_5_loss: 0.3997 - loss: 1.9004 - parsing_head_loss: 0.3945 - learning_rate: 1.0000e-03 - dev_UPOS: 95.6984 - dev_UFeats: 86.5175 - dev_Lemmas: 83.3165 - dev_UAS: 75.2637 - dev_LAS: 67.0549
|
| 78 |
+
Epoch 11/20
|
| 79 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1544 - dense_3_loss: 0.4592 - dense_5_loss: 0.3919 - loss: 1.8534 - parsing_head_loss: 0.3850 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9277 - dev_UFeats: 86.5175 - dev_Lemmas: 83.1514 - dev_UAS: 75.9974 - dev_LAS: 67.4035
|
| 80 |
+
Epoch 12/20
|
| 81 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1530 - dense_3_loss: 0.4516 - dense_5_loss: 0.3868 - loss: 1.8219 - parsing_head_loss: 0.3785 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7810 - dev_UFeats: 86.7376 - dev_Lemmas: 83.7843 - dev_UAS: 76.0066 - dev_LAS: 67.4952
|
| 82 |
+
Epoch 13/20
|
| 83 |
+
319/319 - 48s - 149ms/step - dense_1_loss: 0.1497 - dense_3_loss: 0.4368 - dense_5_loss: 0.3795 - loss: 1.7703 - parsing_head_loss: 0.3676 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0378 - dev_UFeats: 86.5175 - dev_Lemmas: 83.8118 - dev_UAS: 76.4652 - dev_LAS: 68.5041
|
| 84 |
+
Epoch 14/20
|
| 85 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1495 - dense_3_loss: 0.4314 - dense_5_loss: 0.3793 - loss: 1.7641 - parsing_head_loss: 0.3651 - learning_rate: 1.0000e-03 - dev_UPOS: 95.7810 - dev_UFeats: 86.8018 - dev_Lemmas: 83.8852 - dev_UAS: 76.1992 - dev_LAS: 68.1189
|
| 86 |
+
Epoch 15/20
|
| 87 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1507 - dense_3_loss: 0.4319 - dense_5_loss: 0.3804 - loss: 1.7555 - parsing_head_loss: 0.3631 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9094 - dev_UFeats: 86.7009 - dev_Lemmas: 84.0044 - dev_UAS: 76.6028 - dev_LAS: 68.3482
|
| 88 |
+
Epoch 16/20
|
| 89 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1488 - dense_3_loss: 0.4267 - dense_5_loss: 0.3816 - loss: 1.7477 - parsing_head_loss: 0.3629 - learning_rate: 1.0000e-03 - dev_UPOS: 95.9919 - dev_UFeats: 86.6459 - dev_Lemmas: 83.9585 - dev_UAS: 76.9880 - dev_LAS: 69.0085
|
| 90 |
+
Epoch 17/20
|
| 91 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4171 - dense_5_loss: 0.3698 - loss: 1.7093 - parsing_head_loss: 0.3555 - learning_rate: 1.0000e-03 - dev_UPOS: 95.8544 - dev_UFeats: 86.7193 - dev_Lemmas: 84.4722 - dev_UAS: 77.1898 - dev_LAS: 69.0911
|
| 92 |
+
Epoch 18/20
|
| 93 |
+
319/319 - 47s - 148ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4209 - dense_5_loss: 0.3700 - loss: 1.7049 - parsing_head_loss: 0.3523 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0103 - dev_UFeats: 86.5542 - dev_Lemmas: 84.4630 - dev_UAS: 77.4741 - dev_LAS: 69.0085
|
| 94 |
+
Epoch 19/20
|
| 95 |
+
319/319 - 47s - 147ms/step - dense_1_loss: 0.1462 - dense_3_loss: 0.4230 - dense_5_loss: 0.3723 - loss: 1.7028 - parsing_head_loss: 0.3499 - learning_rate: 1.0000e-03 - dev_UPOS: 96.2121 - dev_UFeats: 86.6917 - dev_Lemmas: 84.5914 - dev_UAS: 77.4191 - dev_LAS: 69.3020
|
| 96 |
+
Epoch 20/20
|
| 97 |
+
319/319 - 47s - 147ms/step - dense_1_loss: 0.1449 - dense_3_loss: 0.4171 - dense_5_loss: 0.3664 - loss: 1.6902 - parsing_head_loss: 0.3478 - learning_rate: 1.0000e-03 - dev_UPOS: 96.0286 - dev_UFeats: 86.6000 - dev_Lemmas: 84.5364 - dev_UAS: 77.5750 - dev_LAS: 69.1828
|
| 98 |
+
Epoch 21/120
|
| 99 |
+
/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/.venv/lib/python3.12/site-packages/keras/src/optimizers/base_optimizer.py:731: UserWarning: Gradients do not exist for variables ['variable_783', 'variable_784'] when minimizing the loss. If using `model.compile()`, did you forget to provide a `loss` argument?
|
| 100 |
+
warnings.warn(
|
| 101 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1385 - dense_3_loss: 0.3823 - dense_5_loss: 0.3379 - loss: 1.5763 - parsing_head_loss: 0.3282 - learning_rate: 3.1900e-06 - dev_UPOS: 96.2579 - dev_UFeats: 88.3610 - dev_Lemmas: 85.7746 - dev_UAS: 78.2812 - dev_LAS: 70.1458
|
| 102 |
+
Epoch 22/120
|
| 103 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1323 - dense_3_loss: 0.3601 - dense_5_loss: 0.3065 - loss: 1.4845 - parsing_head_loss: 0.3118 - learning_rate: 6.3800e-06 - dev_UPOS: 96.4047 - dev_UFeats: 89.5258 - dev_Lemmas: 86.3432 - dev_UAS: 78.8957 - dev_LAS: 70.9346
|
| 104 |
+
Epoch 23/120
|
| 105 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1313 - dense_3_loss: 0.3562 - dense_5_loss: 0.2980 - loss: 1.4578 - parsing_head_loss: 0.3071 - learning_rate: 9.5700e-06 - dev_UPOS: 96.4964 - dev_UFeats: 90.1403 - dev_Lemmas: 86.9669 - dev_UAS: 79.2901 - dev_LAS: 71.6684
|
| 106 |
+
Epoch 24/120
|
| 107 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1284 - dense_3_loss: 0.3436 - dense_5_loss: 0.2849 - loss: 1.4103 - parsing_head_loss: 0.2982 - learning_rate: 1.2760e-05 - dev_UPOS: 96.6064 - dev_UFeats: 90.6906 - dev_Lemmas: 87.4255 - dev_UAS: 79.4827 - dev_LAS: 71.9894
|
| 108 |
+
Epoch 25/120
|
| 109 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1280 - dense_3_loss: 0.3364 - dense_5_loss: 0.2808 - loss: 1.3872 - parsing_head_loss: 0.2948 - learning_rate: 1.5950e-05 - dev_UPOS: 96.5973 - dev_UFeats: 90.7732 - dev_Lemmas: 87.8382 - dev_UAS: 79.8588 - dev_LAS: 72.3654
|
| 110 |
+
Epoch 26/120
|
| 111 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1241 - dense_3_loss: 0.3243 - dense_5_loss: 0.2704 - loss: 1.3395 - parsing_head_loss: 0.2844 - learning_rate: 1.9140e-05 - dev_UPOS: 96.7348 - dev_UFeats: 91.1401 - dev_Lemmas: 88.2876 - dev_UAS: 79.9780 - dev_LAS: 72.5672
|
| 112 |
+
Epoch 27/120
|
| 113 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1227 - dense_3_loss: 0.3165 - dense_5_loss: 0.2652 - loss: 1.3156 - parsing_head_loss: 0.2804 - learning_rate: 1.9997e-05 - dev_UPOS: 96.7257 - dev_UFeats: 91.4427 - dev_Lemmas: 88.3702 - dev_UAS: 80.7301 - dev_LAS: 73.5027
|
| 114 |
+
Epoch 28/120
|
| 115 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1247 - dense_3_loss: 0.3399 - dense_5_loss: 0.2654 - loss: 1.3321 - parsing_head_loss: 0.2761 - learning_rate: 1.9983e-05 - dev_UPOS: 96.5697 - dev_UFeats: 91.1401 - dev_Lemmas: 87.2329 - dev_UAS: 80.4733 - dev_LAS: 73.1725
|
| 116 |
+
Epoch 29/120
|
| 117 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.1240 - dense_3_loss: 0.3514 - dense_5_loss: 0.2657 - loss: 1.3377 - parsing_head_loss: 0.2733 - learning_rate: 1.9958e-05 - dev_UPOS: 96.5422 - dev_UFeats: 91.4702 - dev_Lemmas: 87.5997 - dev_UAS: 80.2807 - dev_LAS: 73.2276
|
| 118 |
+
Epoch 30/120
|
| 119 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1213 - dense_3_loss: 0.3353 - dense_5_loss: 0.2564 - loss: 1.2933 - parsing_head_loss: 0.2668 - learning_rate: 1.9922e-05 - dev_UPOS: 96.6156 - dev_UFeats: 91.5711 - dev_Lemmas: 88.0125 - dev_UAS: 80.7209 - dev_LAS: 73.6586
|
| 120 |
+
Epoch 31/120
|
| 121 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1189 - dense_3_loss: 0.3207 - dense_5_loss: 0.2492 - loss: 1.2555 - parsing_head_loss: 0.2600 - learning_rate: 1.9875e-05 - dev_UPOS: 96.6248 - dev_UFeats: 91.5528 - dev_Lemmas: 88.0950 - dev_UAS: 80.5191 - dev_LAS: 73.3926
|
| 122 |
+
Epoch 32/120
|
| 123 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1176 - dense_3_loss: 0.3127 - dense_5_loss: 0.2456 - loss: 1.2358 - parsing_head_loss: 0.2577 - learning_rate: 1.9816e-05 - dev_UPOS: 96.5881 - dev_UFeats: 91.7913 - dev_Lemmas: 88.5903 - dev_UAS: 80.7484 - dev_LAS: 73.5394
|
| 124 |
+
Epoch 33/120
|
| 125 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.1171 - dense_3_loss: 0.3062 - dense_5_loss: 0.2440 - loss: 1.2205 - parsing_head_loss: 0.2546 - learning_rate: 1.9747e-05 - dev_UPOS: 96.6248 - dev_UFeats: 91.9105 - dev_Lemmas: 88.7279 - dev_UAS: 81.0694 - dev_LAS: 74.1631
|
| 126 |
+
Epoch 34/120
|
| 127 |
+
319/319 - 117s - 367ms/step - dense_1_loss: 0.1170 - dense_3_loss: 0.3011 - dense_5_loss: 0.2414 - loss: 1.2074 - parsing_head_loss: 0.2520 - learning_rate: 1.9666e-05 - dev_UPOS: 96.6982 - dev_UFeats: 92.0114 - dev_Lemmas: 88.9480 - dev_UAS: 81.2070 - dev_LAS: 74.1906
|
| 128 |
+
Epoch 35/120
|
| 129 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.1131 - dense_3_loss: 0.2862 - dense_5_loss: 0.2331 - loss: 1.1602 - parsing_head_loss: 0.2428 - learning_rate: 1.9575e-05 - dev_UPOS: 96.6340 - dev_UFeats: 92.0205 - dev_Lemmas: 89.0672 - dev_UAS: 81.0969 - dev_LAS: 74.0989
|
| 130 |
+
Epoch 36/120
|
| 131 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1107 - dense_3_loss: 0.2792 - dense_5_loss: 0.2267 - loss: 1.1310 - parsing_head_loss: 0.2381 - learning_rate: 1.9473e-05 - dev_UPOS: 96.6798 - dev_UFeats: 92.0022 - dev_Lemmas: 89.2048 - dev_UAS: 81.4546 - dev_LAS: 74.4749
|
| 132 |
+
Epoch 37/120
|
| 133 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1103 - dense_3_loss: 0.2745 - dense_5_loss: 0.2243 - loss: 1.1184 - parsing_head_loss: 0.2335 - learning_rate: 1.9360e-05 - dev_UPOS: 96.7440 - dev_UFeats: 92.1123 - dev_Lemmas: 89.2782 - dev_UAS: 81.4638 - dev_LAS: 74.4749
|
| 134 |
+
Epoch 38/120
|
| 135 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1095 - dense_3_loss: 0.2741 - dense_5_loss: 0.2221 - loss: 1.1060 - parsing_head_loss: 0.2301 - learning_rate: 1.9237e-05 - dev_UPOS: 96.7073 - dev_UFeats: 92.1948 - dev_Lemmas: 89.4433 - dev_UAS: 81.5922 - dev_LAS: 74.6767
|
| 136 |
+
Epoch 39/120
|
| 137 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1083 - dense_3_loss: 0.2663 - dense_5_loss: 0.2203 - loss: 1.0912 - parsing_head_loss: 0.2287 - learning_rate: 1.9103e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.2040 - dev_Lemmas: 89.5900 - dev_UAS: 81.6564 - dev_LAS: 74.5208
|
| 138 |
+
Epoch 40/120
|
| 139 |
+
319/319 - 119s - 371ms/step - dense_1_loss: 0.1078 - dense_3_loss: 0.2597 - dense_5_loss: 0.2181 - loss: 1.0751 - parsing_head_loss: 0.2262 - learning_rate: 1.8960e-05 - dev_UPOS: 96.7348 - dev_UFeats: 92.0572 - dev_Lemmas: 89.6451 - dev_UAS: 81.8674 - dev_LAS: 74.9610
|
| 140 |
+
Epoch 41/120
|
| 141 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1073 - dense_3_loss: 0.2565 - dense_5_loss: 0.2161 - loss: 1.0628 - parsing_head_loss: 0.2227 - learning_rate: 1.8806e-05 - dev_UPOS: 96.7715 - dev_UFeats: 92.1856 - dev_Lemmas: 89.7826 - dev_UAS: 81.6106 - dev_LAS: 74.6492
|
| 142 |
+
Epoch 42/120
|
| 143 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1068 - dense_3_loss: 0.2524 - dense_5_loss: 0.2135 - loss: 1.0497 - parsing_head_loss: 0.2197 - learning_rate: 1.8642e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2223 - dev_Lemmas: 89.9385 - dev_UAS: 81.8765 - dev_LAS: 74.9794
|
| 144 |
+
Epoch 43/120
|
| 145 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1050 - dense_3_loss: 0.2498 - dense_5_loss: 0.2108 - loss: 1.0346 - parsing_head_loss: 0.2162 - learning_rate: 1.8469e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.3324 - dev_Lemmas: 90.0486 - dev_UAS: 81.9041 - dev_LAS: 74.9885
|
| 146 |
+
Epoch 44/120
|
| 147 |
+
319/319 - 120s - 375ms/step - dense_1_loss: 0.1037 - dense_3_loss: 0.2427 - dense_5_loss: 0.2060 - loss: 1.0097 - parsing_head_loss: 0.2098 - learning_rate: 1.8286e-05 - dev_UPOS: 96.7165 - dev_UFeats: 92.1581 - dev_Lemmas: 90.0486 - dev_UAS: 81.3446 - dev_LAS: 74.4749
|
| 148 |
+
Epoch 45/120
|
| 149 |
+
319/319 - 119s - 374ms/step - dense_1_loss: 0.1055 - dense_3_loss: 0.2472 - dense_5_loss: 0.2106 - loss: 1.0258 - parsing_head_loss: 0.2135 - learning_rate: 1.8093e-05 - dev_UPOS: 96.6890 - dev_UFeats: 92.3232 - dev_Lemmas: 90.2320 - dev_UAS: 81.9316 - dev_LAS: 74.9885
|
| 150 |
+
Epoch 46/120
|
| 151 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1047 - dense_3_loss: 0.2424 - dense_5_loss: 0.2084 - loss: 1.0162 - parsing_head_loss: 0.2131 - learning_rate: 1.7892e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.3049 - dev_Lemmas: 90.3971 - dev_UAS: 82.1976 - dev_LAS: 75.3004
|
| 152 |
+
Epoch 47/120
|
| 153 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.1033 - dense_3_loss: 0.2379 - dense_5_loss: 0.2035 - loss: 0.9938 - parsing_head_loss: 0.2076 - learning_rate: 1.7682e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2590 - dev_Lemmas: 90.3513 - dev_UAS: 81.9774 - dev_LAS: 75.1169
|
| 154 |
+
Epoch 48/120
|
| 155 |
+
319/319 - 119s - 374ms/step - dense_1_loss: 0.1016 - dense_3_loss: 0.2314 - dense_5_loss: 0.2006 - loss: 0.9747 - parsing_head_loss: 0.2033 - learning_rate: 1.7463e-05 - dev_UPOS: 96.8633 - dev_UFeats: 92.4058 - dev_Lemmas: 90.5164 - dev_UAS: 82.1242 - dev_LAS: 75.2637
|
| 156 |
+
Epoch 49/120
|
| 157 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1031 - dense_3_loss: 0.2358 - dense_5_loss: 0.2034 - loss: 0.9852 - parsing_head_loss: 0.2051 - learning_rate: 1.7236e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2498 - dev_Lemmas: 90.3605 - dev_UAS: 81.9683 - dev_LAS: 75.1628
|
| 158 |
+
Epoch 50/120
|
| 159 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1018 - dense_3_loss: 0.2317 - dense_5_loss: 0.2006 - loss: 0.9704 - parsing_head_loss: 0.2007 - learning_rate: 1.7000e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.3874 - dev_Lemmas: 90.5164 - dev_UAS: 81.9591 - dev_LAS: 75.3554
|
| 160 |
+
Epoch 51/120
|
| 161 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.1018 - dense_3_loss: 0.2302 - dense_5_loss: 0.2006 - loss: 0.9660 - parsing_head_loss: 0.1994 - learning_rate: 1.6757e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.2774 - dev_Lemmas: 90.4797 - dev_UAS: 82.1334 - dev_LAS: 75.4196
|
| 162 |
+
Epoch 52/120
|
| 163 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1019 - dense_3_loss: 0.2286 - dense_5_loss: 0.1995 - loss: 0.9613 - parsing_head_loss: 0.1988 - learning_rate: 1.6506e-05 - dev_UPOS: 96.7807 - dev_UFeats: 92.3507 - dev_Lemmas: 90.5806 - dev_UAS: 82.1425 - dev_LAS: 75.3371
|
| 164 |
+
Epoch 53/120
|
| 165 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.1000 - dense_3_loss: 0.2238 - dense_5_loss: 0.1956 - loss: 0.9408 - parsing_head_loss: 0.1941 - learning_rate: 1.6248e-05 - dev_UPOS: 96.7165 - dev_UFeats: 92.4149 - dev_Lemmas: 90.5622 - dev_UAS: 82.2159 - dev_LAS: 75.2820
|
| 166 |
+
Epoch 54/120
|
| 167 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1001 - dense_3_loss: 0.2233 - dense_5_loss: 0.1957 - loss: 0.9387 - parsing_head_loss: 0.1936 - learning_rate: 1.5983e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.4149 - dev_Lemmas: 90.7548 - dev_UAS: 82.2159 - dev_LAS: 75.4380
|
| 168 |
+
Epoch 55/120
|
| 169 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0982 - dense_3_loss: 0.2167 - dense_5_loss: 0.1912 - loss: 0.9150 - parsing_head_loss: 0.1883 - learning_rate: 1.5711e-05 - dev_UPOS: 96.8541 - dev_UFeats: 92.4516 - dev_Lemmas: 90.7824 - dev_UAS: 82.4819 - dev_LAS: 75.8599
|
| 170 |
+
Epoch 56/120
|
| 171 |
+
319/319 - 117s - 368ms/step - dense_1_loss: 0.1010 - dense_3_loss: 0.2218 - dense_5_loss: 0.1963 - loss: 0.9380 - parsing_head_loss: 0.1933 - learning_rate: 1.5433e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.3966 - dev_Lemmas: 90.7273 - dev_UAS: 82.2709 - dev_LAS: 75.6306
|
| 172 |
+
Epoch 57/120
|
| 173 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.1000 - dense_3_loss: 0.2185 - dense_5_loss: 0.1936 - loss: 0.9218 - parsing_head_loss: 0.1890 - learning_rate: 1.5148e-05 - dev_UPOS: 96.7715 - dev_UFeats: 92.4975 - dev_Lemmas: 90.7365 - dev_UAS: 82.3535 - dev_LAS: 75.6306
|
| 174 |
+
Epoch 58/120
|
| 175 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.0968 - dense_3_loss: 0.2121 - dense_5_loss: 0.1874 - loss: 0.8931 - parsing_head_loss: 0.1823 - learning_rate: 1.4858e-05 - dev_UPOS: 96.8633 - dev_UFeats: 92.6167 - dev_Lemmas: 90.7732 - dev_UAS: 82.4635 - dev_LAS: 75.6948
|
| 176 |
+
Epoch 59/120
|
| 177 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0988 - dense_3_loss: 0.2156 - dense_5_loss: 0.1914 - loss: 0.9091 - parsing_head_loss: 0.1852 - learning_rate: 1.4562e-05 - dev_UPOS: 96.8541 - dev_UFeats: 92.5158 - dev_Lemmas: 90.7915 - dev_UAS: 82.2801 - dev_LAS: 75.7315
|
| 178 |
+
Epoch 60/120
|
| 179 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0977 - dense_3_loss: 0.2126 - dense_5_loss: 0.1890 - loss: 0.8969 - parsing_head_loss: 0.1826 - learning_rate: 1.4262e-05 - dev_UPOS: 96.7899 - dev_UFeats: 92.5617 - dev_Lemmas: 90.8557 - dev_UAS: 82.4911 - dev_LAS: 75.8323
|
| 180 |
+
Epoch 61/120
|
| 181 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0961 - dense_3_loss: 0.2089 - dense_5_loss: 0.1857 - loss: 0.8822 - parsing_head_loss: 0.1799 - learning_rate: 1.3956e-05 - dev_UPOS: 96.8174 - dev_UFeats: 92.4608 - dev_Lemmas: 90.9474 - dev_UAS: 82.2526 - dev_LAS: 75.5388
|
| 182 |
+
Epoch 62/120
|
| 183 |
+
319/319 - 117s - 368ms/step - dense_1_loss: 0.0974 - dense_3_loss: 0.2105 - dense_5_loss: 0.1882 - loss: 0.8906 - parsing_head_loss: 0.1812 - learning_rate: 1.3646e-05 - dev_UPOS: 96.8816 - dev_UFeats: 92.4791 - dev_Lemmas: 90.8741 - dev_UAS: 82.5094 - dev_LAS: 75.9607
|
| 184 |
+
Epoch 63/120
|
| 185 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0971 - dense_3_loss: 0.2096 - dense_5_loss: 0.1874 - loss: 0.8835 - parsing_head_loss: 0.1789 - learning_rate: 1.3332e-05 - dev_UPOS: 96.8266 - dev_UFeats: 92.3874 - dev_Lemmas: 90.8924 - dev_UAS: 82.5186 - dev_LAS: 75.7957
|
| 186 |
+
Epoch 64/120
|
| 187 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0969 - dense_3_loss: 0.2081 - dense_5_loss: 0.1864 - loss: 0.8806 - parsing_head_loss: 0.1789 - learning_rate: 1.3014e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 90.9658 - dev_UAS: 82.4085 - dev_LAS: 75.7865
|
| 188 |
+
Epoch 65/120
|
| 189 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0951 - dense_3_loss: 0.2036 - dense_5_loss: 0.1826 - loss: 0.8593 - parsing_head_loss: 0.1732 - learning_rate: 1.2693e-05 - dev_UPOS: 96.8724 - dev_UFeats: 92.5158 - dev_Lemmas: 90.9750 - dev_UAS: 82.3810 - dev_LAS: 75.7681
|
| 190 |
+
Epoch 66/120
|
| 191 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0954 - dense_3_loss: 0.2046 - dense_5_loss: 0.1836 - loss: 0.8627 - parsing_head_loss: 0.1741 - learning_rate: 1.2369e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.5342 - dev_Lemmas: 90.9199 - dev_UAS: 82.6286 - dev_LAS: 75.9974
|
| 192 |
+
Epoch 67/120
|
| 193 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0952 - dense_3_loss: 0.2028 - dense_5_loss: 0.1825 - loss: 0.8563 - parsing_head_loss: 0.1719 - learning_rate: 1.2042e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5342 - dev_Lemmas: 90.9566 - dev_UAS: 82.4085 - dev_LAS: 75.7865
|
| 194 |
+
Epoch 68/120
|
| 195 |
+
319/319 - 117s - 366ms/step - dense_1_loss: 0.0961 - dense_3_loss: 0.2042 - dense_5_loss: 0.1841 - loss: 0.8612 - parsing_head_loss: 0.1740 - learning_rate: 1.1713e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 91.0025 - dev_UAS: 82.4360 - dev_LAS: 75.9057
|
| 196 |
+
Epoch 69/120
|
| 197 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0943 - dense_3_loss: 0.2004 - dense_5_loss: 0.1807 - loss: 0.8462 - parsing_head_loss: 0.1700 - learning_rate: 1.1381e-05 - dev_UPOS: 96.8724 - dev_UFeats: 92.6993 - dev_Lemmas: 91.0759 - dev_UAS: 82.4452 - dev_LAS: 75.8048
|
| 198 |
+
Epoch 70/120
|
| 199 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0945 - dense_3_loss: 0.2005 - dense_5_loss: 0.1809 - loss: 0.8462 - parsing_head_loss: 0.1703 - learning_rate: 1.1049e-05 - dev_UPOS: 96.7990 - dev_UFeats: 92.5433 - dev_Lemmas: 90.9841 - dev_UAS: 82.5644 - dev_LAS: 75.9699
|
| 200 |
+
Epoch 71/120
|
| 201 |
+
319/319 - 118s - 368ms/step - dense_1_loss: 0.0949 - dense_3_loss: 0.2006 - dense_5_loss: 0.1819 - loss: 0.8481 - parsing_head_loss: 0.1705 - learning_rate: 1.0715e-05 - dev_UPOS: 96.7807 - dev_UFeats: 92.6809 - dev_Lemmas: 90.9016 - dev_UAS: 82.5277 - dev_LAS: 75.7681
|
| 202 |
+
Epoch 72/120
|
| 203 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0946 - dense_3_loss: 0.1989 - dense_5_loss: 0.1808 - loss: 0.8418 - parsing_head_loss: 0.1688 - learning_rate: 1.0380e-05 - dev_UPOS: 96.8449 - dev_UFeats: 92.6442 - dev_Lemmas: 91.0300 - dev_UAS: 82.7662 - dev_LAS: 76.1075
|
| 204 |
+
Epoch 73/120
|
| 205 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1976 - dense_5_loss: 0.1795 - loss: 0.8370 - parsing_head_loss: 0.1682 - learning_rate: 1.0045e-05 - dev_UPOS: 96.8082 - dev_UFeats: 92.6442 - dev_Lemmas: 91.1401 - dev_UAS: 82.6195 - dev_LAS: 76.0525
|
| 206 |
+
Epoch 74/120
|
| 207 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1984 - dense_5_loss: 0.1792 - loss: 0.8365 - parsing_head_loss: 0.1677 - learning_rate: 9.7100e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.5709 - dev_Lemmas: 91.0208 - dev_UAS: 82.7295 - dev_LAS: 75.8782
|
| 208 |
+
Epoch 75/120
|
| 209 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.0924 - dense_3_loss: 0.1937 - dense_5_loss: 0.1759 - loss: 0.8182 - parsing_head_loss: 0.1641 - learning_rate: 9.3752e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6351 - dev_Lemmas: 90.9933 - dev_UAS: 82.7112 - dev_LAS: 76.1167
|
| 210 |
+
Epoch 76/120
|
| 211 |
+
319/319 - 119s - 373ms/step - dense_1_loss: 0.0923 - dense_3_loss: 0.1932 - dense_5_loss: 0.1756 - loss: 0.8164 - parsing_head_loss: 0.1638 - learning_rate: 9.0411e-06 - dev_UPOS: 96.8449 - dev_UFeats: 92.5525 - dev_Lemmas: 91.0759 - dev_UAS: 82.9038 - dev_LAS: 76.2176
|
| 212 |
+
Epoch 77/120
|
| 213 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0938 - dense_3_loss: 0.1958 - dense_5_loss: 0.1777 - loss: 0.8261 - parsing_head_loss: 0.1656 - learning_rate: 8.7081e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.6626 - dev_Lemmas: 91.0575 - dev_UAS: 82.6103 - dev_LAS: 75.7590
|
| 214 |
+
Epoch 78/120
|
| 215 |
+
319/319 - 118s - 368ms/step - dense_1_loss: 0.0941 - dense_3_loss: 0.1964 - dense_5_loss: 0.1783 - loss: 0.8268 - parsing_head_loss: 0.1653 - learning_rate: 8.3765e-06 - dev_UPOS: 96.8174 - dev_UFeats: 92.6075 - dev_Lemmas: 91.0850 - dev_UAS: 82.8121 - dev_LAS: 76.1625
|
| 216 |
+
Epoch 79/120
|
| 217 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0921 - dense_3_loss: 0.1916 - dense_5_loss: 0.1748 - loss: 0.8098 - parsing_head_loss: 0.1615 - learning_rate: 8.0468e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5617 - dev_Lemmas: 91.1125 - dev_UAS: 82.6011 - dev_LAS: 76.0066
|
| 218 |
+
Epoch 80/120
|
| 219 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0928 - dense_3_loss: 0.1932 - dense_5_loss: 0.1763 - loss: 0.8147 - parsing_head_loss: 0.1624 - learning_rate: 7.7192e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.5433 - dev_Lemmas: 91.1217 - dev_UAS: 82.4819 - dev_LAS: 75.8507
|
| 220 |
+
Epoch 81/120
|
| 221 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0922 - dense_3_loss: 0.1912 - dense_5_loss: 0.1746 - loss: 0.8088 - parsing_head_loss: 0.1618 - learning_rate: 7.3942e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.5892 - dev_Lemmas: 91.1401 - dev_UAS: 82.8212 - dev_LAS: 76.1900
|
| 222 |
+
Epoch 82/120
|
| 223 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0917 - dense_3_loss: 0.1904 - dense_5_loss: 0.1734 - loss: 0.8012 - parsing_head_loss: 0.1596 - learning_rate: 7.0722e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.5800 - dev_Lemmas: 91.1767 - dev_UAS: 82.6928 - dev_LAS: 76.0433
|
| 224 |
+
Epoch 83/120
|
| 225 |
+
319/319 - 117s - 368ms/step - dense_1_loss: 0.0929 - dense_3_loss: 0.1923 - dense_5_loss: 0.1755 - loss: 0.8112 - parsing_head_loss: 0.1623 - learning_rate: 6.7534e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6167 - dev_Lemmas: 91.1951 - dev_UAS: 82.6837 - dev_LAS: 75.9699
|
| 226 |
+
Epoch 84/120
|
| 227 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0919 - dense_3_loss: 0.1904 - dense_5_loss: 0.1736 - loss: 0.8032 - parsing_head_loss: 0.1605 - learning_rate: 6.4382e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5984 - dev_Lemmas: 91.2409 - dev_UAS: 82.8671 - dev_LAS: 76.2726
|
| 228 |
+
Epoch 85/120
|
| 229 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0926 - dense_3_loss: 0.1914 - dense_5_loss: 0.1743 - loss: 0.8058 - parsing_head_loss: 0.1609 - learning_rate: 6.1271e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2134 - dev_UAS: 82.8029 - dev_LAS: 76.1900
|
| 230 |
+
Epoch 86/120
|
| 231 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0915 - dense_3_loss: 0.1895 - dense_5_loss: 0.1732 - loss: 0.7982 - parsing_head_loss: 0.1595 - learning_rate: 5.8203e-06 - dev_UPOS: 96.8266 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2685 - dev_UAS: 82.8854 - dev_LAS: 76.2176
|
| 232 |
+
Epoch 87/120
|
| 233 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1888 - dense_5_loss: 0.1731 - loss: 0.7967 - parsing_head_loss: 0.1592 - learning_rate: 5.5182e-06 - dev_UPOS: 96.8082 - dev_UFeats: 92.5342 - dev_Lemmas: 91.1492 - dev_UAS: 82.8121 - dev_LAS: 76.1809
|
| 234 |
+
Epoch 88/120
|
| 235 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0912 - dense_3_loss: 0.1870 - dense_5_loss: 0.1717 - loss: 0.7896 - parsing_head_loss: 0.1573 - learning_rate: 5.2212e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.5525 - dev_Lemmas: 91.1584 - dev_UAS: 82.8396 - dev_LAS: 76.2359
|
| 236 |
+
Epoch 89/120
|
| 237 |
+
319/319 - 119s - 374ms/step - dense_1_loss: 0.0902 - dense_3_loss: 0.1852 - dense_5_loss: 0.1699 - loss: 0.7832 - parsing_head_loss: 0.1564 - learning_rate: 4.9295e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.5158 - dev_Lemmas: 91.1951 - dev_UAS: 82.8488 - dev_LAS: 76.2451
|
| 238 |
+
Epoch 90/120
|
| 239 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0908 - dense_3_loss: 0.1866 - dense_5_loss: 0.1711 - loss: 0.7863 - parsing_head_loss: 0.1566 - learning_rate: 4.6435e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.5709 - dev_Lemmas: 91.1584 - dev_UAS: 82.8121 - dev_LAS: 76.1258
|
| 240 |
+
Epoch 91/120
|
| 241 |
+
319/319 - 117s - 367ms/step - dense_1_loss: 0.0928 - dense_3_loss: 0.1897 - dense_5_loss: 0.1743 - loss: 0.8008 - parsing_head_loss: 0.1597 - learning_rate: 4.3635e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2318 - dev_UAS: 82.9221 - dev_LAS: 76.1992
|
| 242 |
+
Epoch 92/120
|
| 243 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1877 - dense_5_loss: 0.1720 - loss: 0.7908 - parsing_head_loss: 0.1573 - learning_rate: 4.0899e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.5617 - dev_Lemmas: 91.1584 - dev_UAS: 82.8671 - dev_LAS: 76.2084
|
| 244 |
+
Epoch 93/120
|
| 245 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0915 - dense_3_loss: 0.1874 - dense_5_loss: 0.1716 - loss: 0.7898 - parsing_head_loss: 0.1573 - learning_rate: 3.8229e-06 - dev_UPOS: 96.8449 - dev_UFeats: 92.6167 - dev_Lemmas: 91.2226 - dev_UAS: 83.0047 - dev_LAS: 76.4652
|
| 246 |
+
Epoch 94/120
|
| 247 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0906 - dense_3_loss: 0.1859 - dense_5_loss: 0.1707 - loss: 0.7818 - parsing_head_loss: 0.1557 - learning_rate: 3.5628e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6167 - dev_Lemmas: 91.1859 - dev_UAS: 82.9405 - dev_LAS: 76.3643
|
| 248 |
+
Epoch 95/120
|
| 249 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1860 - dense_5_loss: 0.1708 - loss: 0.7825 - parsing_head_loss: 0.1559 - learning_rate: 3.3100e-06 - dev_UPOS: 96.8082 - dev_UFeats: 92.5800 - dev_Lemmas: 91.2501 - dev_UAS: 82.9680 - dev_LAS: 76.3368
|
| 250 |
+
Epoch 96/120
|
| 251 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0911 - dense_3_loss: 0.1862 - dense_5_loss: 0.1707 - loss: 0.7841 - parsing_head_loss: 0.1562 - learning_rate: 3.0647e-06 - dev_UPOS: 96.8541 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2501 - dev_UAS: 82.9772 - dev_LAS: 76.3184
|
| 252 |
+
Epoch 97/120
|
| 253 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0909 - dense_3_loss: 0.1858 - dense_5_loss: 0.1702 - loss: 0.7812 - parsing_head_loss: 0.1550 - learning_rate: 2.8272e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6351 - dev_Lemmas: 91.2226 - dev_UAS: 82.9496 - dev_LAS: 76.1992
|
| 254 |
+
Epoch 98/120
|
| 255 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0916 - dense_3_loss: 0.1872 - dense_5_loss: 0.1721 - loss: 0.7876 - parsing_head_loss: 0.1568 - learning_rate: 2.5977e-06 - dev_UPOS: 96.8816 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2501 - dev_UAS: 83.1056 - dev_LAS: 76.3918
|
| 256 |
+
Epoch 99/120
|
| 257 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0911 - dense_3_loss: 0.1858 - dense_5_loss: 0.1709 - loss: 0.7825 - parsing_head_loss: 0.1560 - learning_rate: 2.3765e-06 - dev_UPOS: 96.8908 - dev_UFeats: 92.6351 - dev_Lemmas: 91.2868 - dev_UAS: 83.0780 - dev_LAS: 76.4193
|
| 258 |
+
Epoch 100/120
|
| 259 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1860 - dense_5_loss: 0.1707 - loss: 0.7828 - parsing_head_loss: 0.1563 - learning_rate: 2.1639e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0597 - dev_LAS: 76.3460
|
| 260 |
+
Epoch 101/120
|
| 261 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1853 - dense_5_loss: 0.1701 - loss: 0.7803 - parsing_head_loss: 0.1553 - learning_rate: 1.9601e-06 - dev_UPOS: 96.8816 - dev_UFeats: 92.6075 - dev_Lemmas: 91.2501 - dev_UAS: 82.9405 - dev_LAS: 76.2176
|
| 262 |
+
Epoch 102/120
|
| 263 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0917 - dense_3_loss: 0.1868 - dense_5_loss: 0.1715 - loss: 0.7851 - parsing_head_loss: 0.1563 - learning_rate: 1.7654e-06 - dev_UPOS: 96.8908 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2043 - dev_UAS: 83.0322 - dev_LAS: 76.3093
|
| 264 |
+
Epoch 103/120
|
| 265 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0904 - dense_3_loss: 0.1838 - dense_5_loss: 0.1689 - loss: 0.7747 - parsing_head_loss: 0.1546 - learning_rate: 1.5799e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2226 - dev_UAS: 83.0597 - dev_LAS: 76.3093
|
| 266 |
+
Epoch 104/120
|
| 267 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1863 - dense_5_loss: 0.1716 - loss: 0.7853 - parsing_head_loss: 0.1562 - learning_rate: 1.4038e-06 - dev_UPOS: 96.8357 - dev_UFeats: 92.6717 - dev_Lemmas: 91.2318 - dev_UAS: 82.9588 - dev_LAS: 76.2542
|
| 268 |
+
Epoch 105/120
|
| 269 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0907 - dense_3_loss: 0.1852 - dense_5_loss: 0.1694 - loss: 0.7765 - parsing_head_loss: 0.1546 - learning_rate: 1.2374e-06 - dev_UPOS: 96.8724 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2593 - dev_UAS: 82.9221 - dev_LAS: 76.2909
|
| 270 |
+
Epoch 106/120
|
| 271 |
+
319/319 - 117s - 367ms/step - dense_1_loss: 0.0920 - dense_3_loss: 0.1871 - dense_5_loss: 0.1720 - loss: 0.7874 - parsing_head_loss: 0.1566 - learning_rate: 1.0809e-06 - dev_UPOS: 96.8633 - dev_UFeats: 92.6442 - dev_Lemmas: 91.2685 - dev_UAS: 82.9772 - dev_LAS: 76.3551
|
| 272 |
+
Epoch 107/120
|
| 273 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0896 - dense_3_loss: 0.1819 - dense_5_loss: 0.1674 - loss: 0.7668 - parsing_head_loss: 0.1535 - learning_rate: 9.3436e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2685 - dev_UAS: 82.9863 - dev_LAS: 76.3551
|
| 274 |
+
Epoch 108/120
|
| 275 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0919 - dense_3_loss: 0.1867 - dense_5_loss: 0.1718 - loss: 0.7850 - parsing_head_loss: 0.1558 - learning_rate: 7.9801e-07 - dev_UPOS: 96.8633 - dev_UFeats: 92.6534 - dev_Lemmas: 91.3143 - dev_UAS: 83.0047 - dev_LAS: 76.3918
|
| 276 |
+
Epoch 109/120
|
| 277 |
+
319/319 - 117s - 367ms/step - dense_1_loss: 0.0925 - dense_3_loss: 0.1879 - dense_5_loss: 0.1728 - loss: 0.7907 - parsing_head_loss: 0.1576 - learning_rate: 6.7200e-07 - dev_UPOS: 96.8633 - dev_UFeats: 92.6167 - dev_Lemmas: 91.2685 - dev_UAS: 82.9772 - dev_LAS: 76.3368
|
| 278 |
+
Epoch 110/120
|
| 279 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1859 - dense_5_loss: 0.1708 - loss: 0.7818 - parsing_head_loss: 0.1556 - learning_rate: 5.5647e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.5892 - dev_Lemmas: 91.2501 - dev_UAS: 82.9863 - dev_LAS: 76.3643
|
| 280 |
+
Epoch 111/120
|
| 281 |
+
319/319 - 118s - 371ms/step - dense_1_loss: 0.0912 - dense_3_loss: 0.1860 - dense_5_loss: 0.1704 - loss: 0.7807 - parsing_head_loss: 0.1554 - learning_rate: 4.5154e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6717 - dev_Lemmas: 91.2685 - dev_UAS: 83.0414 - dev_LAS: 76.4010
|
| 282 |
+
Epoch 112/120
|
| 283 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0903 - dense_3_loss: 0.1832 - dense_5_loss: 0.1688 - loss: 0.7721 - parsing_head_loss: 0.1538 - learning_rate: 3.5734e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2409 - dev_UAS: 83.0505 - dev_LAS: 76.3918
|
| 284 |
+
Epoch 113/120
|
| 285 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0908 - dense_3_loss: 0.1843 - dense_5_loss: 0.1694 - loss: 0.7747 - parsing_head_loss: 0.1537 - learning_rate: 2.7398e-07 - dev_UPOS: 96.8724 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0230 - dev_LAS: 76.3735
|
| 286 |
+
Epoch 114/120
|
| 287 |
+
319/319 - 117s - 368ms/step - dense_1_loss: 0.0922 - dense_3_loss: 0.1875 - dense_5_loss: 0.1721 - loss: 0.7869 - parsing_head_loss: 0.1569 - learning_rate: 2.0153e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6534 - dev_Lemmas: 91.2868 - dev_UAS: 83.0505 - dev_LAS: 76.3826
|
| 288 |
+
Epoch 115/120
|
| 289 |
+
319/319 - 119s - 372ms/step - dense_1_loss: 0.0904 - dense_3_loss: 0.1836 - dense_5_loss: 0.1691 - loss: 0.7736 - parsing_head_loss: 0.1540 - learning_rate: 1.4010e-07 - dev_UPOS: 96.8816 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2868 - dev_UAS: 83.0230 - dev_LAS: 76.3735
|
| 290 |
+
Epoch 116/120
|
| 291 |
+
319/319 - 118s - 369ms/step - dense_1_loss: 0.0914 - dense_3_loss: 0.1856 - dense_5_loss: 0.1708 - loss: 0.7800 - parsing_head_loss: 0.1554 - learning_rate: 8.9738e-08 - dev_UPOS: 96.8633 - dev_UFeats: 92.6626 - dev_Lemmas: 91.2776 - dev_UAS: 82.9772 - dev_LAS: 76.3460
|
| 292 |
+
Epoch 117/120
|
| 293 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0909 - dense_3_loss: 0.1848 - dense_5_loss: 0.1697 - loss: 0.7763 - parsing_head_loss: 0.1545 - learning_rate: 5.0511e-08 - dev_UPOS: 96.8633 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0138 - dev_LAS: 76.3551
|
| 294 |
+
Epoch 118/120
|
| 295 |
+
319/319 - 117s - 368ms/step - dense_1_loss: 0.0918 - dense_3_loss: 0.1864 - dense_5_loss: 0.1715 - loss: 0.7834 - parsing_head_loss: 0.1561 - learning_rate: 2.2460e-08 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 83.0047 - dev_LAS: 76.3643
|
| 296 |
+
Epoch 119/120
|
| 297 |
+
319/319 - 118s - 370ms/step - dense_1_loss: 0.0910 - dense_3_loss: 0.1845 - dense_5_loss: 0.1698 - loss: 0.7767 - parsing_head_loss: 0.1546 - learning_rate: 5.6165e-09 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 82.9955 - dev_LAS: 76.3643
|
| 298 |
+
Epoch 120/120
|
| 299 |
+
319/319 - 123s - 385ms/step - dense_1_loss: 0.0898 - dense_3_loss: 0.1824 - dense_5_loss: 0.1676 - loss: 0.7677 - parsing_head_loss: 0.1526 - learning_rate: 0.0000e+00 - dev_UPOS: 96.8816 - dev_UFeats: 92.6259 - dev_Lemmas: 91.2868 - dev_UAS: 82.9955 - dev_LAS: 76.3643 - test_UPOS: 97.1577 - test_UFeats: 93.5661 - test_Lemmas: 90.6416 - test_UAS: 83.7141 - test_LAS: 77.1614
|
| 300 |
+
Traceback (most recent call last):
|
| 301 |
+
File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 935, in <module>
|
| 302 |
+
main([] if "__file__" not in globals() else None)
|
| 303 |
+
File "/gpfs/bwfor/home/hd/hd_hd/hd_ec199/reproduce/evalatin2024-latinpipe/latinpipe_evalatin24.py", line 819, in main
|
| 304 |
+
with open(os.path.join(os.path.dirname(args.load[0]), "options.json"), mode="r") as options_file:
|
| 305 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 306 |
+
FileNotFoundError: [Errno 2] No such file or directory: '/home/hd/hd_hd/hd_ec199/evalatin2024-latinpipe/latinpipe-evalatin/options.json'
|