Jacobo committed on
Commit
c20efa3
1 Parent(s): 354f8cf

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -13,57 +13,57 @@ model-index:
13
  metrics:
14
  - name: TAG (XPOS) Accuracy
15
  type: accuracy
16
- value: 0.8956201577
17
  - task:
18
  name: POS
19
  type: token-classification
20
  metrics:
21
  - name: POS (UPOS) Accuracy
22
  type: accuracy
23
- value: 0.8900634727
24
  - task:
25
  name: MORPH
26
  type: token-classification
27
  metrics:
28
  - name: Morph (UFeats) Accuracy
29
  type: accuracy
30
- value: 0.833069799
31
  - task:
32
  name: LEMMA
33
  type: token-classification
34
  metrics:
35
  - name: Lemma Accuracy
36
  type: accuracy
37
- value: 0.9104912479
38
  - task:
39
  name: UNLABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Unlabeled Attachment Score (UAS)
43
  type: f_score
44
- value: 0.6668855274
45
  - task:
46
  name: LABELED_DEPENDENCIES
47
  type: token-classification
48
  metrics:
49
  - name: Labeled Attachment Score (LAS)
50
  type: f_score
51
- value: 0.5832828283
52
  - task:
53
  name: SENTS
54
  type: token-classification
55
  metrics:
56
  - name: Sentences F-Score
57
  type: f_score
58
- value: 0.9851138354
59
  ---
60
  | Feature | Description |
61
  | --- | --- |
62
  | **Name** | `grc_perseus_sm` |
63
- | **Version** | `3.5.2` |
64
- | **spaCy** | `>=3.5.2,<3.6.0` |
65
- | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `senter`, `lemmatizer`, `attribute_ruler` |
66
- | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `senter`, `lemmatizer`, `attribute_ruler` |
67
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
68
  | **Sources** | n/a |
69
  | **License** | n/a |
@@ -87,16 +87,16 @@ model-index:
87
 
88
  | Type | Score |
89
  | --- | --- |
90
- | `POS_ACC` | 89.01 |
91
- | `MORPH_ACC` | 83.31 |
92
- | `TAG_ACC` | 89.56 |
93
- | `DEP_UAS` | 66.69 |
94
- | `DEP_LAS` | 58.33 |
95
- | `SENTS_P` | 98.08 |
96
- | `SENTS_R` | 98.94 |
97
- | `SENTS_F` | 98.51 |
98
- | `LEMMA_ACC` | 91.05 |
99
- | `TOK2VEC_LOSS` | 3400933.71 |
100
- | `MORPHOLOGIZER_LOSS` | 173976.78 |
101
- | `TAGGER_LOSS` | 76908.63 |
102
- | `PARSER_LOSS` | 1643447.20 |
 
13
  metrics:
14
  - name: TAG (XPOS) Accuracy
15
  type: accuracy
16
+ value: 0.8967495652
17
  - task:
18
  name: POS
19
  type: token-classification
20
  metrics:
21
  - name: POS (UPOS) Accuracy
22
  type: accuracy
23
+ value: 0.8929297493
24
  - task:
25
  name: MORPH
26
  type: token-classification
27
  metrics:
28
  - name: Morph (UFeats) Accuracy
29
  type: accuracy
30
+ value: 0.8346510052
31
  - task:
32
  name: LEMMA
33
  type: token-classification
34
  metrics:
35
  - name: Lemma Accuracy
36
  type: accuracy
37
+ value: 0.9723320158
38
  - task:
39
  name: UNLABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Unlabeled Attachment Score (UAS)
43
  type: f_score
44
+ value: 0.6605898394
45
  - task:
46
  name: LABELED_DEPENDENCIES
47
  type: token-classification
48
  metrics:
49
  - name: Labeled Attachment Score (LAS)
50
  type: f_score
51
+ value: 0.5799121345
52
  - task:
53
  name: SENTS
54
  type: token-classification
55
  metrics:
56
  - name: Sentences F-Score
57
  type: f_score
58
+ value: 0.9868421053
59
  ---
60
  | Feature | Description |
61
  | --- | --- |
62
  | **Name** | `grc_perseus_sm` |
63
+ | **Version** | `3.5.3` |
64
+ | **spaCy** | `>=3.5.3,<3.6.0` |
65
+ | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
66
+ | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
67
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
68
  | **Sources** | n/a |
69
  | **License** | n/a |
 
87
 
88
  | Type | Score |
89
  | --- | --- |
90
+ | `POS_ACC` | 89.25 |
91
+ | `MORPH_ACC` | 83.52 |
92
+ | `TAG_ACC` | 89.55 |
93
+ | `DEP_UAS` | 65.61 |
94
+ | `DEP_LAS` | 57.82 |
95
+ | `SENTS_P` | 96.53 |
96
+ | `SENTS_R` | 97.98 |
97
+ | `SENTS_F` | 97.25 |
98
+ | `LEMMA_ACC` | 97.23 |
99
+ | `TOK2VEC_LOSS` | 3135697.59 |
100
+ | `MORPHOLOGIZER_LOSS` | 245681.24 |
101
+ | `TAGGER_LOSS` | 107655.17 |
102
+ | `PARSER_LOSS` | 1960197.14 |
accuracy.json CHANGED
@@ -3,196 +3,196 @@
3
  "token_p":0.9983307102,
4
  "token_r":0.9987117706,
5
  "token_f":0.998521204,
6
- "pos_acc":0.8719160105,
7
- "morph_acc":0.8214464673,
8
- "morph_micro_p":0.8816652914,
9
- "morph_micro_r":0.8722568857,
10
- "morph_micro_f":0.8769358542,
11
  "morph_per_feat":{
12
  "Mood":{
13
- "p":0.8664416586,
14
- "r":0.8714839961,
15
- "f":0.8689555126
16
  },
17
  "Number":{
18
- "p":0.9432498848,
19
- "r":0.9342105263,
20
- "f":0.9387084448
21
  },
22
  "Person":{
23
- "p":0.8688760807,
24
- "r":0.8413953488,
25
- "f":0.8549149338
26
  },
27
  "Tense":{
28
- "p":0.7710973308,
29
- "r":0.767167382,
30
- "f":0.7691273363
31
  },
32
  "VerbForm":{
33
- "p":0.8935022917,
34
- "r":0.8899033298,
35
- "f":0.8916991793
36
  },
37
  "Voice":{
38
- "p":0.8777987591,
39
- "r":0.8728540773,
40
- "f":0.8753194351
41
  },
42
  "Case":{
43
- "p":0.901890929,
44
- "r":0.8909845682,
45
- "f":0.896404576
46
  },
47
  "Gender":{
48
- "p":0.8426442352,
49
- "r":0.8335745297,
50
- "f":0.8380848452
51
  },
52
  "Aspect":{
53
- "p":0.6860986547,
54
- "r":0.6789940828,
55
- "f":0.682527881
56
  },
57
  "Degree":{
58
- "p":0.2380952381,
59
- "r":0.1063829787,
60
- "f":0.1470588235
61
  }
62
  },
63
- "tag_acc":0.8770489848,
64
- "sents_p":0.9504132231,
65
- "sents_r":0.9686064319,
66
- "sents_f":0.9594235874,
67
- "dep_uas":0.6455083378,
68
- "dep_las":0.5632916499,
69
  "dep_las_per_type":{
70
  "root":{
71
- "p":0.7969924812,
72
- "r":0.8116385911,
73
- "f":0.8042488619
74
  },
75
  "advmod":{
76
- "p":0.5846343468,
77
- "r":0.5528360528,
78
- "f":0.5682907348
79
  },
80
  "nsubj":{
81
- "p":0.5756266206,
82
- "r":0.4970149254,
83
- "f":0.5334401282
84
  },
85
  "det":{
86
- "p":0.7866666667,
87
- "r":0.7639933166,
88
- "f":0.7751642297
89
  },
90
  "nmod":{
91
- "p":0.4362121876,
92
- "r":0.4418294849,
93
- "f":0.4390028679
94
  },
95
  "obj":{
96
- "p":0.4490521327,
97
- "r":0.501986755,
98
- "f":0.4740462789
99
  },
100
  "advcl":{
101
- "p":0.4595375723,
102
- "r":0.4779559118,
103
- "f":0.4685658153
104
  },
105
  "cc":{
106
- "p":0.4134727062,
107
- "r":0.5460122699,
108
- "f":0.4705882353
109
  },
110
  "conj":{
111
- "p":0.4285714286,
112
- "r":0.4342629482,
113
- "f":0.4313984169
114
  },
115
  "amod":{
116
- "p":0.1388888889,
117
- "r":0.0344827586,
118
- "f":0.0552486188
119
  },
120
  "cop":{
121
- "p":0.5211267606,
122
- "r":0.524822695,
123
- "f":0.5229681979
124
  },
125
  "obl":{
126
- "p":0.5133282559,
127
- "r":0.4835007174,
128
- "f":0.4979682305
129
  },
130
  "case":{
131
- "p":0.8221757322,
132
- "r":0.817047817,
133
- "f":0.8196037539
134
  },
135
  "xcomp":{
136
- "p":0.2685714286,
137
- "r":0.2706333973,
138
- "f":0.2695984704
139
  },
140
  "csubj":{
141
- "p":0.2631578947,
142
- "r":0.1282051282,
143
- "f":0.1724137931
144
  },
145
  "mark":{
146
- "p":0.733974359,
147
- "r":0.661849711,
148
- "f":0.6960486322
149
  },
150
  "ccomp":{
151
- "p":0.5222222222,
152
- "r":0.3560606061,
153
- "f":0.4234234234
154
- },
155
- "parataxis":{
156
- "p":0.0689655172,
157
- "r":0.2222222222,
158
- "f":0.1052631579
159
  },
160
  "dep":{
161
  "p":0.0,
162
  "r":0.0,
163
  "f":0.0
164
  },
165
- "appos":{
166
- "p":0.1818181818,
167
- "r":0.1379310345,
168
- "f":0.1568627451
169
- },
170
  "acl":{
171
- "p":0.3026315789,
172
  "r":0.1742424242,
173
- "f":0.2211538462
174
  },
175
  "iobj":{
176
- "p":0.2450980392,
177
- "r":0.2525252525,
178
- "f":0.2487562189
 
 
 
 
 
179
  },
180
  "discourse":{
181
- "p":0.8,
182
- "r":0.7272727273,
183
- "f":0.7619047619
184
  },
185
  "vocative":{
186
- "p":0.3456790123,
187
- "r":0.3456790123,
188
- "f":0.3456790123
 
 
 
 
 
189
  },
190
  "nummod":{
191
- "p":0.05,
192
- "r":0.3333333333,
193
- "f":0.0869565217
194
  }
195
  },
196
- "lemma_acc":0.8506476468,
197
- "speed":6348.1191496176
198
  }
 
3
  "token_p":0.9983307102,
4
  "token_r":0.9987117706,
5
  "token_f":0.998521204,
6
+ "pos_acc":0.8695506932,
7
+ "morph_acc":0.8207587688,
8
+ "morph_micro_p":0.8816986258,
9
+ "morph_micro_r":0.8705075126,
10
+ "morph_micro_f":0.8760673311,
11
  "morph_per_feat":{
12
  "Mood":{
13
+ "p":0.869502175,
14
+ "r":0.8724539282,
15
+ "f":0.8709755507
16
  },
17
  "Number":{
18
+ "p":0.9452759229,
19
+ "r":0.9367204138,
20
+ "f":0.9409787218
21
  },
22
  "Person":{
23
+ "p":0.8754826255,
24
+ "r":0.8437209302,
25
+ "f":0.8593083847
26
  },
27
  "Tense":{
28
+ "p":0.7706746464,
29
+ "r":0.7599248927,
30
+ "f":0.7652620205
31
  },
32
  "VerbForm":{
33
+ "p":0.8925462459,
34
+ "r":0.8810418904,
35
+ "f":0.8867567568
36
  },
37
  "Voice":{
38
+ "p":0.8799346583,
39
+ "r":0.8669527897,
40
+ "f":0.8733954871
41
  },
42
  "Case":{
43
+ "p":0.8979107746,
44
+ "r":0.8881869867,
45
+ "f":0.8930224118
46
  },
47
  "Gender":{
48
+ "p":0.8402447936,
49
+ "r":0.832036903,
50
+ "f":0.8361207053
51
  },
52
  "Aspect":{
53
+ "p":0.7065217391,
54
+ "r":0.6730769231,
55
+ "f":0.6893939394
56
  },
57
  "Degree":{
58
+ "p":0.3043478261,
59
+ "r":0.1489361702,
60
+ "f":0.2
61
  }
62
  },
63
+ "tag_acc":0.8772875856,
64
+ "sents_p":0.9717987805,
65
+ "sents_r":0.9762633997,
66
+ "sents_f":0.974025974,
67
+ "dep_uas":0.6452202916,
68
+ "dep_las":0.5622764315,
69
  "dep_las_per_type":{
70
  "root":{
71
+ "p":0.8170731707,
72
+ "r":0.8208269525,
73
+ "f":0.8189457601
74
  },
75
  "advmod":{
76
+ "p":0.5800391389,
77
+ "r":0.5757575758,
78
+ "f":0.577890427
79
  },
80
  "nsubj":{
81
+ "p":0.546728972,
82
+ "r":0.523880597,
83
+ "f":0.5350609756
84
  },
85
  "det":{
86
+ "p":0.7865509761,
87
+ "r":0.7573099415,
88
+ "f":0.7716535433
89
  },
90
  "nmod":{
91
+ "p":0.427184466,
92
+ "r":0.4298401421,
93
+ "f":0.4285081895
94
  },
95
  "obj":{
96
+ "p":0.458254865,
97
+ "r":0.4834437086,
98
+ "f":0.4705124073
99
  },
100
  "advcl":{
101
+ "p":0.4983277592,
102
+ "r":0.4478957916,
103
+ "f":0.47176781
104
  },
105
  "cc":{
106
+ "p":0.4601769912,
107
+ "r":0.5582822086,
108
+ "f":0.5045045045
109
  },
110
  "conj":{
111
+ "p":0.4688856729,
112
+ "r":0.4302788845,
113
+ "f":0.4487534626
114
  },
115
  "amod":{
116
+ "p":0.0416666667,
117
+ "r":0.0137931034,
118
+ "f":0.0207253886
119
  },
120
  "cop":{
121
+ "p":0.480565371,
122
+ "r":0.4822695035,
123
+ "f":0.4814159292
124
  },
125
  "obl":{
126
+ "p":0.4888248017,
127
+ "r":0.4863701578,
128
+ "f":0.4875943905
129
  },
130
  "case":{
131
+ "p":0.8123697012,
132
+ "r":0.8101178101,
133
+ "f":0.8112421929
134
  },
135
  "xcomp":{
136
+ "p":0.2343987823,
137
+ "r":0.2955854127,
138
+ "f":0.2614601019
139
  },
140
  "csubj":{
141
+ "p":0.2592592593,
142
+ "r":0.1794871795,
143
+ "f":0.2121212121
144
  },
145
  "mark":{
146
+ "p":0.7413249211,
147
+ "r":0.6791907514,
148
+ "f":0.7088989442
149
  },
150
  "ccomp":{
151
+ "p":0.4269662921,
152
+ "r":0.2878787879,
153
+ "f":0.3438914027
 
 
 
 
 
154
  },
155
  "dep":{
156
  "p":0.0,
157
  "r":0.0,
158
  "f":0.0
159
  },
 
 
 
 
 
160
  "acl":{
161
+ "p":0.2346938776,
162
  "r":0.1742424242,
163
+ "f":0.2
164
  },
165
  "iobj":{
166
+ "p":0.3333333333,
167
+ "r":0.1919191919,
168
+ "f":0.2435897436
169
+ },
170
+ "appos":{
171
+ "p":0.1,
172
+ "r":0.1034482759,
173
+ "f":0.1016949153
174
  },
175
  "discourse":{
176
+ "p":0.6774193548,
177
+ "r":0.6363636364,
178
+ "f":0.65625
179
  },
180
  "vocative":{
181
+ "p":0.3870967742,
182
+ "r":0.2962962963,
183
+ "f":0.3356643357
184
+ },
185
+ "parataxis":{
186
+ "p":0.0625,
187
+ "r":0.2222222222,
188
+ "f":0.0975609756
189
  },
190
  "nummod":{
191
+ "p":0.0952380952,
192
+ "r":0.6666666667,
193
+ "f":0.1666666667
194
  }
195
  },
196
+ "lemma_acc":0.9007418716,
197
+ "speed":5323.2062856447
198
  }
attribute_ruler/patterns CHANGED
Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ
 
config.cfg CHANGED
@@ -10,7 +10,7 @@ seed = 0
10
 
11
  [nlp]
12
  lang = "grc"
13
- pipeline = ["tok2vec","morphologizer","tagger","parser","senter","lemmatizer","attribute_ruler"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
@@ -86,26 +86,6 @@ nO = null
86
  width = ${components.tok2vec.model.encode.width}
87
  upstream = "tok2vec"
88
 
89
- [components.senter]
90
- factory = "senter"
91
- overwrite = false
92
- scorer = {"@scorers":"spacy.senter_scorer.v1"}
93
-
94
- [components.senter.model]
95
- @architectures = "spacy.Tagger.v2"
96
- nO = null
97
- normalize = false
98
-
99
- [components.senter.model.tok2vec]
100
- @architectures = "spacy.HashEmbedCNN.v2"
101
- pretrained_vectors = null
102
- width = 12
103
- depth = 1
104
- embed_size = 2000
105
- window_size = 1
106
- maxout_pieces = 2
107
- subword_features = true
108
-
109
  [components.tagger]
110
  factory = "tagger"
111
  neg_prefix = "!"
@@ -171,7 +151,7 @@ patience = 5000
171
  max_epochs = 0
172
  max_steps = 20000
173
  eval_frequency = 200
174
- frozen_components = ["lemmatizer","senter"]
175
  annotating_components = []
176
  before_to_disk = null
177
  before_update = null
@@ -191,7 +171,7 @@ t = 0.0
191
 
192
  [training.logger]
193
  @loggers = "spacy.WandbLogger.v3"
194
- project_name = "proiel"
195
  remove_config_values = ["paths.train","paths.dev","corpora.train.path","corpora.dev.path"]
196
  log_dataset_dir = "./corpus"
197
  model_log_interval = 1000
 
10
 
11
  [nlp]
12
  lang = "grc"
13
+ pipeline = ["tok2vec","morphologizer","tagger","parser","lemmatizer","attribute_ruler"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
 
86
  width = ${components.tok2vec.model.encode.width}
87
  upstream = "tok2vec"
88
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
89
  [components.tagger]
90
  factory = "tagger"
91
  neg_prefix = "!"
 
151
  max_epochs = 0
152
  max_steps = 20000
153
  eval_frequency = 200
154
+ frozen_components = ["lemmatizer"]
155
  annotating_components = []
156
  before_to_disk = null
157
  before_update = null
 
171
 
172
  [training.logger]
173
  @loggers = "spacy.WandbLogger.v3"
174
+ project_name = "greCy"
175
  remove_config_values = ["paths.train","paths.dev","corpora.train.path","corpora.dev.path"]
176
  log_dataset_dir = "./corpus"
177
  model_log_interval = 1000
grc_perseus_sm-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c720b3dcb877fe1233b751e0450636816b9c1f5bd66c5c698c6fc61d70336e4c
3
- size 59581491
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:477d5bcf44e05750a70595038b0b832a4431003b235f78f554c9c468b1f61344
3
+ size 59912019
lemmatizer/cfg CHANGED
The diff for this file is too large to render. See raw diff
 
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:930386d436927c541305cb480afa8a4ca75d03894abfee89a23fd4e76e8c6d73
3
- size 24138324
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7943319b989596449853f63213d3598cab16ee8576e94756e1406f352f95469c
3
+ size 24263260
lemmatizer/trees CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:889486752498ce47ce48b7888f1249c92d5fb5c505a20574ad38a4a77476c9b1
3
- size 4833057
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b4cacd6282ecfa887b731fe8aed793709e236050f81662e72cd06fe73a6458
3
+ size 5318689
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"grc",
3
  "name":"perseus_sm",
4
- "version":"3.5.2",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
- "spacy_version":">=3.5.2,<3.6.0",
11
- "spacy_git_version":"Unknown",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -946,7 +946,6 @@
946
  "morphologizer",
947
  "tagger",
948
  "parser",
949
- "senter",
950
  "lemmatizer",
951
  "attribute_ruler"
952
  ],
@@ -955,7 +954,6 @@
955
  "morphologizer",
956
  "tagger",
957
  "parser",
958
- "senter",
959
  "lemmatizer",
960
  "attribute_ruler"
961
  ],
@@ -963,183 +961,183 @@
963
 
964
  ],
965
  "performance":{
966
- "pos_acc":0.8900634727,
967
- "morph_acc":0.833069799,
968
  "morph_per_feat":{
969
  "Case":{
970
- "p":0.9182653699,
971
- "r":0.907575624,
972
- "f":0.9128892043
973
  },
974
  "Gender":{
975
- "p":0.8753682707,
976
- "r":0.8661660777,
977
- "f":0.8707428622
978
  },
979
  "Number":{
980
- "p":0.9502866626,
981
- "r":0.9431716083,
982
- "f":0.9467157673
983
  },
984
  "Degree":{
985
- "p":0.5245901639,
986
- "r":0.1882352941,
987
- "f":0.2770562771
988
  },
989
  "Tense":{
990
- "p":0.7458996328,
991
- "r":0.7383086988,
992
- "f":0.742084754
993
  },
994
  "VerbForm":{
995
- "p":0.9023255814,
996
- "r":0.8931427187,
997
- "f":0.8977106673
998
  },
999
  "Voice":{
1000
- "p":0.8849167483,
1001
- "r":0.8763336566,
1002
- "f":0.8806042885
1003
  },
1004
  "Aspect":{
1005
- "p":0.7173913043,
1006
- "r":0.6431181486,
1007
- "f":0.6782273603
1008
  },
1009
  "Mood":{
1010
- "p":0.8452903856,
1011
- "r":0.8587010412,
1012
- "f":0.8519429415
1013
  },
1014
  "Person":{
1015
- "p":0.8706854643,
1016
- "r":0.8544847328,
1017
- "f":0.8625090296
1018
  }
1019
  },
1020
- "tag_acc":0.8956201577,
1021
- "dep_uas":0.6668855274,
1022
- "dep_las":0.5832828283,
1023
  "dep_las_per_type":{
1024
  "det":{
1025
- "p":0.8400460299,
1026
- "r":0.8138238573,
1027
- "f":0.8267270668
1028
  },
1029
  "advmod":{
1030
- "p":0.630127774,
1031
- "r":0.6041263701,
1032
- "f":0.6168531929
1033
  },
1034
  "case":{
1035
- "p":0.8592268417,
1036
- "r":0.8751857355,
1037
- "f":0.8671328671
1038
  },
1039
  "nmod":{
1040
- "p":0.4193548387,
1041
- "r":0.4342672414,
1042
- "f":0.4266807835
1043
  },
1044
  "cc":{
1045
- "p":0.4908026756,
1046
- "r":0.5699029126,
1047
- "f":0.5274034142
1048
  },
1049
  "conj":{
1050
- "p":0.4895738894,
1051
- "r":0.4864864865,
1052
- "f":0.488025305
1053
  },
1054
  "csubj":{
1055
- "p":0.35,
1056
- "r":0.1359223301,
1057
- "f":0.1958041958
1058
  },
1059
  "obl":{
1060
- "p":0.496124031,
1061
- "r":0.4971751412,
1062
- "f":0.49664903
1063
  },
1064
  "root":{
1065
- "p":0.8151700087,
1066
- "r":0.8223394899,
1067
- "f":0.8187390543
1068
  },
1069
  "cop":{
1070
- "p":0.5682656827,
1071
- "r":0.5441696113,
1072
- "f":0.5559566787
1073
  },
1074
  "obj":{
1075
- "p":0.4538807649,
1076
- "r":0.5186375321,
1077
- "f":0.4841031794
1078
  },
1079
  "acl":{
1080
- "p":0.1978021978,
1081
- "r":0.1111111111,
1082
- "f":0.1422924901
1083
  },
1084
  "xcomp":{
1085
- "p":0.3108298172,
1086
- "r":0.3240469208,
1087
- "f":0.3173007897
1088
  },
1089
  "nsubj":{
1090
- "p":0.5744476465,
1091
- "r":0.4701257862,
1092
- "f":0.5170773887
1093
  },
1094
  "amod":{
1095
- "p":0.0784313725,
1096
- "r":0.0294117647,
1097
- "f":0.0427807487
1098
  },
1099
  "advcl":{
1100
- "p":0.4567188788,
1101
- "r":0.4825783972,
1102
- "f":0.4692926726
1103
  },
1104
  "mark":{
1105
- "p":0.7689969605,
1106
- "r":0.704735376,
1107
- "f":0.7354651163
1108
  },
1109
  "iobj":{
1110
- "p":0.3518518519,
1111
- "r":0.2794117647,
1112
- "f":0.3114754098
1113
  },
1114
  "dep":{
1115
  "p":0.0,
1116
  "r":0.0,
1117
  "f":0.0
1118
  },
1119
- "parataxis":{
1120
  "p":0.0,
1121
  "r":0.0,
1122
  "f":0.0
1123
  },
1124
  "ccomp":{
1125
- "p":0.3233082707,
1126
- "r":0.2067307692,
1127
- "f":0.2521994135
1128
  },
1129
- "nummod":{
1130
- "p":0.0666666667,
1131
- "r":0.125,
1132
- "f":0.0869565217
1133
  },
1134
  "vocative":{
1135
- "p":0.5,
1136
- "r":0.5217391304,
1137
- "f":0.5106382979
1138
  },
1139
- "appos":{
1140
- "p":0.125,
1141
- "r":0.08,
1142
- "f":0.0975609756
1143
  },
1144
  "discourse":{
1145
  "p":0.9375,
@@ -1147,14 +1145,14 @@
1147
  "f":0.9090909091
1148
  }
1149
  },
1150
- "sents_p":0.9808195292,
1151
  "sents_r":0.9894459103,
1152
- "sents_f":0.9851138354,
1153
- "lemma_acc":0.9104912479,
1154
- "tok2vec_loss":34009.3370705922,
1155
- "morphologizer_loss":1739.7677844763,
1156
- "tagger_loss":769.0862725675,
1157
- "parser_loss":16434.4719876691
1158
  },
1159
  "requirements":[
1160
 
 
1
  {
2
  "lang":"grc",
3
  "name":"perseus_sm",
4
+ "version":"3.5.3",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
+ "spacy_version":">=3.5.3,<3.6.0",
11
+ "spacy_git_version":"512241e12",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
946
  "morphologizer",
947
  "tagger",
948
  "parser",
 
949
  "lemmatizer",
950
  "attribute_ruler"
951
  ],
 
954
  "morphologizer",
955
  "tagger",
956
  "parser",
 
957
  "lemmatizer",
958
  "attribute_ruler"
959
  ],
 
961
 
962
  ],
963
  "performance":{
964
+ "pos_acc":0.8929297493,
965
+ "morph_acc":0.8346510052,
966
  "morph_per_feat":{
967
  "Case":{
968
+ "p":0.9179131054,
969
+ "r":0.9092512567,
970
+ "f":0.9135616499
971
  },
972
  "Gender":{
973
+ "p":0.8731403118,
974
+ "r":0.8658127208,
975
+ "f":0.8694610778
976
  },
977
  "Number":{
978
+ "p":0.9484939759,
979
+ "r":0.9430967355,
980
+ "f":0.9457876558
981
  },
982
  "Degree":{
983
+ "p":0.4925373134,
984
+ "r":0.1941176471,
985
+ "f":0.2784810127
986
  },
987
  "Tense":{
988
+ "p":0.7461127308,
989
+ "r":0.7441240611,
990
+ "f":0.745117069
991
  },
992
  "VerbForm":{
993
+ "p":0.9018464529,
994
+ "r":0.8994426945,
995
+ "f":0.9006429698
996
  },
997
  "Voice":{
998
+ "p":0.8808075894,
999
+ "r":0.8780310378,
1000
+ "f":0.879417122
1001
  },
1002
  "Aspect":{
1003
+ "p":0.7550724638,
1004
+ "r":0.634591961,
1005
+ "f":0.6896095301
1006
  },
1007
  "Mood":{
1008
+ "p":0.849609375,
1009
+ "r":0.8626673277,
1010
+ "f":0.8560885609
1011
  },
1012
  "Person":{
1013
+ "p":0.8747563353,
1014
+ "r":0.8563931298,
1015
+ "f":0.8654773385
1016
  }
1017
  },
1018
+ "tag_acc":0.8967495652,
1019
+ "dep_uas":0.6605898394,
1020
+ "dep_las":0.5799121345,
1021
  "dep_las_per_type":{
1022
  "det":{
1023
+ "p":0.8470770422,
1024
+ "r":0.8130806392,
1025
+ "f":0.8297307546
1026
  },
1027
  "advmod":{
1028
+ "p":0.6020663745,
1029
+ "r":0.6199226306,
1030
+ "f":0.6108640407
1031
  },
1032
  "case":{
1033
+ "p":0.8546384222,
1034
+ "r":0.8692421991,
1035
+ "f":0.861878453
1036
  },
1037
  "nmod":{
1038
+ "p":0.4320920044,
1039
+ "r":0.4251077586,
1040
+ "f":0.4285714286
1041
  },
1042
  "cc":{
1043
+ "p":0.5095715588,
1044
+ "r":0.5427184466,
1045
+ "f":0.5256229431
1046
  },
1047
  "conj":{
1048
+ "p":0.4928278689,
1049
+ "r":0.4333333333,
1050
+ "f":0.4611697028
1051
  },
1052
  "csubj":{
1053
+ "p":0.4347826087,
1054
+ "r":0.1941747573,
1055
+ "f":0.2684563758
1056
  },
1057
  "obl":{
1058
+ "p":0.4923611111,
1059
+ "r":0.5007062147,
1060
+ "f":0.4964985994
1061
  },
1062
  "root":{
1063
+ "p":0.8005249344,
1064
+ "r":0.8047493404,
1065
+ "f":0.8026315789
1066
  },
1067
  "cop":{
1068
+ "p":0.537593985,
1069
+ "r":0.5053003534,
1070
+ "f":0.5209471767
1071
  },
1072
  "obj":{
1073
+ "p":0.4622144112,
1074
+ "r":0.5070694087,
1075
+ "f":0.4836040454
1076
  },
1077
  "acl":{
1078
+ "p":0.252173913,
1079
+ "r":0.1790123457,
1080
+ "f":0.2093862816
1081
  },
1082
  "xcomp":{
1083
+ "p":0.2749445676,
1084
+ "r":0.3636363636,
1085
+ "f":0.3131313131
1086
  },
1087
  "nsubj":{
1088
+ "p":0.5424610052,
1089
+ "r":0.4921383648,
1090
+ "f":0.516075845
1091
  },
1092
  "amod":{
1093
+ "p":0.1363636364,
1094
+ "r":0.0661764706,
1095
+ "f":0.0891089109
1096
  },
1097
  "advcl":{
1098
+ "p":0.5194174757,
1099
+ "r":0.4660278746,
1100
+ "f":0.4912764004
1101
  },
1102
  "mark":{
1103
+ "p":0.7138728324,
1104
+ "r":0.6880222841,
1105
+ "f":0.7007092199
1106
  },
1107
  "iobj":{
1108
+ "p":0.3636363636,
1109
+ "r":0.2058823529,
1110
+ "f":0.2629107981
1111
  },
1112
  "dep":{
1113
  "p":0.0,
1114
  "r":0.0,
1115
  "f":0.0
1116
  },
1117
+ "appos":{
1118
  "p":0.0,
1119
  "r":0.0,
1120
  "f":0.0
1121
  },
1122
  "ccomp":{
1123
+ "p":0.3858267717,
1124
+ "r":0.2355769231,
1125
+ "f":0.2925373134
1126
  },
1127
+ "parataxis":{
1128
+ "p":0.0,
1129
+ "r":0.0,
1130
+ "f":0.0
1131
  },
1132
  "vocative":{
1133
+ "p":0.3333333333,
1134
+ "r":0.3913043478,
1135
+ "f":0.36
1136
  },
1137
+ "nummod":{
1138
+ "p":0.1578947368,
1139
+ "r":0.1875,
1140
+ "f":0.1714285714
1141
  },
1142
  "discourse":{
1143
  "p":0.9375,
 
1145
  "f":0.9090909091
1146
  }
1147
  },
1148
+ "sents_p":0.9842519685,
1149
  "sents_r":0.9894459103,
1150
+ "sents_f":0.9868421053,
1151
+ "lemma_acc":0.9723320158,
1152
+ "tok2vec_loss":37568.3918470888,
1153
+ "morphologizer_loss":1413.9878097773,
1154
+ "tagger_loss":653.8194056507,
1155
+ "parser_loss":15512.3811200972
1156
  },
1157
  "requirements":[
1158
 
morphologizer/model CHANGED
Binary files a/morphologizer/model and b/morphologizer/model differ
 
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a3e8902ee357781567c8e673371ba9dfe8145694dc5e179444283b1cda0f599
3
  size 1787174
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:736bac09572f96f956b0f115d8b4735b85506388de942488eb4f4402aba2493b
3
  size 1787174
tagger/model CHANGED
Binary files a/tagger/model and b/tagger/model differ
 
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eeeccfa4ce2558615f6708bbbf5d319783f98ebd12cb2b4831cc65794a26b28a
3
  size 34875837
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d48dddef89b68884b1757c8c92414a66834b87f98a0f38e250c8005d39618d7
3
  size 34875837
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20743e47b7d04efa38a6d5c70c3201002a82280c38aa788a64a65f8868f4104c
3
- size 12443077
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8325579291b33a014614b91dc7a42d6627bdc964ba3635a49a84564bd0b88db4
3
+ size 17971365