Jacobo commited on
Commit
7c8574a
1 Parent(s): dc17a5f

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -13,55 +13,55 @@ model-index:
13
  metrics:
14
  - name: TAG (XPOS) Accuracy
15
  type: accuracy
16
- value: 0.9750219748
17
  - task:
18
  name: POS
19
  type: token-classification
20
  metrics:
21
  - name: POS (UPOS) Accuracy
22
  type: accuracy
23
- value: 0.9726047466
24
  - task:
25
  name: MORPH
26
  type: token-classification
27
  metrics:
28
  - name: Morph (UFeats) Accuracy
29
  type: accuracy
30
- value: 0.9088045708
31
  - task:
32
  name: LEMMA
33
  type: token-classification
34
  metrics:
35
  - name: Lemma Accuracy
36
  type: accuracy
37
- value: 0.9732639906
38
  - task:
39
  name: UNLABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Unlabeled Attachment Score (UAS)
43
  type: f_score
44
- value: 0.8111631995
45
  - task:
46
  name: LABELED_DEPENDENCIES
47
  type: token-classification
48
  metrics:
49
  - name: Labeled Attachment Score (LAS)
50
  type: f_score
51
- value: 0.7622326399
52
  - task:
53
  name: SENTS
54
  type: token-classification
55
  metrics:
56
  - name: Sentences F-Score
57
  type: f_score
58
- value: 0.6111922141
59
  ---
60
  | Feature | Description |
61
  | --- | --- |
62
  | **Name** | `grc_proiel_lg` |
63
- | **Version** | `3.5.3` |
64
- | **spaCy** | `>=3.5.3,<3.6.0` |
65
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
66
  | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
67
  | **Vectors** | -1 keys, 200000 unique vectors (300 dimensions) |
@@ -87,16 +87,16 @@ model-index:
87
 
88
  | Type | Score |
89
  | --- | --- |
90
- | `POS_ACC` | 97.30 |
91
- | `MORPH_ACC` | 90.60 |
92
- | `TAG_ACC` | 97.70 |
93
- | `DEP_UAS` | 80.68 |
94
- | `DEP_LAS` | 76.07 |
95
- | `SENTS_P` | 56.43 |
96
- | `SENTS_R` | 62.02 |
97
- | `SENTS_F` | 59.09 |
98
- | `LEMMA_ACC` | 97.33 |
99
- | `TOK2VEC_LOSS` | 7384506.01 |
100
- | `MORPHOLOGIZER_LOSS` | 80044.78 |
101
- | `TAGGER_LOSS` | 25253.04 |
102
- | `PARSER_LOSS` | 1795439.09 |
 
13
  metrics:
14
  - name: TAG (XPOS) Accuracy
15
  type: accuracy
16
+ value: 0.9753149722
17
  - task:
18
  name: POS
19
  type: token-classification
20
  metrics:
21
  - name: POS (UPOS) Accuracy
22
  type: accuracy
23
+ value: 0.97333724
24
  - task:
25
  name: MORPH
26
  type: token-classification
27
  metrics:
28
  - name: Morph (UFeats) Accuracy
29
  type: accuracy
30
+ value: 0.9031643715
31
  - task:
32
  name: LEMMA
33
  type: token-classification
34
  metrics:
35
  - name: Lemma Accuracy
36
  type: accuracy
37
+ value: 0.9745092294
38
  - task:
39
  name: UNLABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Unlabeled Attachment Score (UAS)
43
  type: f_score
44
+ value: 0.8039115148
45
  - task:
46
  name: LABELED_DEPENDENCIES
47
  type: token-classification
48
  metrics:
49
  - name: Labeled Attachment Score (LAS)
50
  type: f_score
51
+ value: 0.75666569
52
  - task:
53
  name: SENTS
54
  type: token-classification
55
  metrics:
56
  - name: Sentences F-Score
57
  type: f_score
58
+ value: 0.6032818533
59
  ---
60
  | Feature | Description |
61
  | --- | --- |
62
  | **Name** | `grc_proiel_lg` |
63
+ | **Version** | `3.6.0` |
64
+ | **spaCy** | `>=3.6.0,<3.7.0` |
65
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
66
  | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler` |
67
  | **Vectors** | -1 keys, 200000 unique vectors (300 dimensions) |
 
87
 
88
  | Type | Score |
89
  | --- | --- |
90
+ | `POS_ACC` | 97.33 |
91
+ | `MORPH_ACC` | 90.32 |
92
+ | `TAG_ACC` | 97.53 |
93
+ | `DEP_UAS` | 80.39 |
94
+ | `DEP_LAS` | 75.67 |
95
+ | `SENTS_P` | 59.35 |
96
+ | `SENTS_R` | 61.33 |
97
+ | `SENTS_F` | 60.33 |
98
+ | `LEMMA_ACC` | 97.45 |
99
+ | `TOK2VEC_LOSS` | 7465584.11 |
100
+ | `MORPHOLOGIZER_LOSS` | 211872.15 |
101
+ | `TAGGER_LOSS` | 48038.59 |
102
+ | `PARSER_LOSS` | 2751762.68 |
accuracy.json CHANGED
@@ -3,204 +3,204 @@
3
  "token_p":1.0,
4
  "token_r":1.0,
5
  "token_f":1.0,
6
- "pos_acc":0.9705573081,
7
- "morph_acc":0.9017575484,
8
- "morph_micro_p":0.9639012033,
9
- "morph_micro_r":0.9622471098,
10
- "morph_micro_f":0.9630734463,
11
  "morph_per_feat":{
12
  "Case":{
13
- "p":0.9706231063,
14
- "r":0.9690911482,
15
- "f":0.9698565223
16
  },
17
  "Gender":{
18
- "p":0.9175940647,
19
- "r":0.9184458295,
20
- "f":0.9180197495
21
  },
22
  "Number":{
23
- "p":0.9906521973,
24
- "r":0.9892703863,
25
- "f":0.9899608096
26
  },
27
  "Aspect":{
28
- "p":0.9545454545,
29
- "r":0.9565522074,
30
- "f":0.9555477774
31
  },
32
  "Mood":{
33
- "p":0.9621212121,
34
- "r":0.961560862,
35
- "f":0.9618409554
36
  },
37
  "Person":{
38
- "p":0.9724980901,
39
- "r":0.9680608365,
40
- "f":0.9702743902
41
  },
42
  "Tense":{
43
- "p":0.9582570487,
44
- "r":0.9551094891,
45
- "f":0.9566806799
46
  },
47
  "VerbForm":{
48
- "p":0.9871841816,
49
- "r":0.9835826341,
50
- "f":0.985380117
51
  },
52
  "Voice":{
53
- "p":0.9469058953,
54
- "r":0.9437956204,
55
- "f":0.9453481996
56
  },
57
  "PronType":{
58
- "p":0.9835183317,
59
- "r":0.9779264214,
60
- "f":0.9807144055
61
  },
62
  "Degree":{
63
- "p":0.8667529107,
64
- "r":0.8769633508,
65
- "f":0.8718282368
66
  },
67
  "Definite":{
68
- "p":0.9921962096,
69
- "r":0.991643454,
70
- "f":0.9919197548
71
  },
72
  "Reflex":{
73
  "p":1.0,
74
- "r":0.9782608696,
75
- "f":0.989010989
76
  },
77
  "Polarity":{
78
- "p":0.995412844,
79
- "r":0.9819004525,
80
- "f":0.9886104784
81
  },
82
  "Poss":{
83
- "p":0.8333333333,
84
- "r":0.3846153846,
85
- "f":0.5263157895
86
  }
87
  },
88
- "tag_acc":0.9742376446,
89
- "sents_p":0.5994180407,
90
- "sents_r":0.5902578797,
91
- "sents_f":0.5948026949,
92
- "dep_uas":0.7958539883,
93
- "dep_las":0.7480847228,
94
  "dep_las_per_type":{
95
  "iobj":{
96
- "p":0.7191780822,
97
  "r":0.7208237986,
98
- "f":0.72
99
  },
100
  "root":{
101
- "p":0.786614937,
102
- "r":0.7745940783,
103
- "f":0.7805582291
104
  },
105
  "nsubj":{
106
- "p":0.701754386,
107
- "r":0.7174887892,
108
- "f":0.7095343681
109
  },
110
  "advmod":{
111
- "p":0.7222222222,
112
- "r":0.6861111111,
113
- "f":0.7037037037
114
  },
115
  "advcl":{
116
- "p":0.6400651466,
117
- "r":0.6517412935,
118
- "f":0.6458504519
119
  },
120
  "ccomp":{
121
- "p":0.5155279503,
122
- "r":0.512345679,
123
- "f":0.5139318885
124
  },
125
  "discourse":{
126
- "p":0.8063186813,
127
- "r":0.8074277854,
128
- "f":0.8068728522
129
  },
130
  "obj":{
131
- "p":0.7548717949,
132
- "r":0.8114663727,
133
- "f":0.7821466525
134
  },
135
  "det":{
136
- "p":0.9367201426,
137
- "r":0.9223343572,
138
- "f":0.9294715897
139
  },
140
  "nmod":{
141
- "p":0.7134615385,
142
- "r":0.7162162162,
143
- "f":0.7148362235
144
  },
145
  "cop":{
146
- "p":0.72,
147
- "r":0.7641509434,
148
- "f":0.7414187643
149
  },
150
  "appos":{
151
- "p":0.3916666667,
152
- "r":0.2865853659,
153
- "f":0.3309859155
154
  },
155
  "case":{
156
- "p":0.9578587699,
157
- "r":0.9567690557,
158
- "f":0.9573136027
159
  },
160
  "acl":{
161
- "p":0.4932432432,
162
- "r":0.4451219512,
163
- "f":0.4679487179
164
  },
165
  "mark":{
166
- "p":0.8930232558,
167
- "r":0.8888888889,
168
- "f":0.8909512761
169
  },
170
  "obl":{
171
- "p":0.6829558999,
172
- "r":0.7198492462,
173
- "f":0.7009174312
174
  },
175
  "nsubj:pass":{
176
- "p":0.776119403,
177
- "r":0.5473684211,
178
- "f":0.6419753086
179
  },
180
  "xcomp":{
181
- "p":0.6,
182
- "r":0.475,
183
- "f":0.5302325581
184
  },
185
  "cc":{
186
- "p":0.6378968254,
187
- "r":0.6366336634,
188
- "f":0.6372646184
189
  },
190
  "conj":{
191
- "p":0.5728643216,
192
- "r":0.5922077922,
193
- "f":0.5823754789
194
  },
195
  "dislocated":{
196
- "p":0.0,
197
- "r":0.0,
198
- "f":0.0
199
  },
200
  "amod":{
201
- "p":0.6968325792,
202
- "r":0.712962963,
203
- "f":0.704805492
204
  },
205
  "parataxis":{
206
  "p":0.0,
@@ -213,34 +213,39 @@
213
  "f":0.0
214
  },
215
  "nummod":{
216
- "p":0.8805970149,
217
- "r":0.8428571429,
218
- "f":0.8613138686
219
  },
220
  "fixed":{
221
- "p":0.7777777778,
222
- "r":0.875,
223
- "f":0.8235294118
224
  },
225
  "csubj:pass":{
226
- "p":0.5,
227
- "r":0.1428571429,
228
- "f":0.2222222222
229
  },
230
  "obl:agent":{
231
- "p":0.8571428571,
232
- "r":0.2727272727,
233
- "f":0.4137931034
234
  },
235
  "orphan":{
236
- "p":0.1481481481,
237
- "r":0.1142857143,
238
- "f":0.1290322581
239
  },
240
  "vocative":{
241
- "p":0.7755102041,
242
  "r":0.6229508197,
243
- "f":0.6909090909
 
 
 
 
 
244
  },
245
  "aux":{
246
  "p":0.0,
@@ -251,13 +256,8 @@
251
  "p":0.0,
252
  "r":0.0,
253
  "f":0.0
254
- },
255
- "flat:name":{
256
- "p":0.8571428571,
257
- "r":0.8571428571,
258
- "f":0.8571428571
259
  }
260
  },
261
- "lemma_acc":0.9724350308,
262
- "speed":3885.4826243627
263
  }
 
3
  "token_p":1.0,
4
  "token_r":1.0,
5
  "token_f":1.0,
6
+ "pos_acc":0.9690551299,
7
+ "morph_acc":0.8973261229,
8
+ "morph_micro_p":0.9620992574,
9
+ "morph_micro_r":0.9594924133,
10
+ "morph_micro_f":0.9607940671,
11
  "morph_per_feat":{
12
  "Case":{
13
+ "p":0.9703635406,
14
+ "r":0.9689596212,
15
+ "f":0.9696610727
16
  },
17
  "Gender":{
18
+ "p":0.9136538207,
19
+ "r":0.9148654025,
20
+ "f":0.9142592102
21
  },
22
  "Number":{
23
+ "p":0.9888172043,
24
+ "r":0.986695279,
25
+ "f":0.987755102
26
  },
27
  "Aspect":{
28
+ "p":0.9461914745,
29
+ "r":0.9488437281,
30
+ "f":0.9475157453
31
  },
32
  "Mood":{
33
+ "p":0.9607728337,
34
+ "r":0.9557367501,
35
+ "f":0.9582481752
36
  },
37
  "Person":{
38
+ "p":0.9749518304,
39
+ "r":0.9619771863,
40
+ "f":0.9684210526
41
  },
42
  "Tense":{
43
+ "p":0.9530791789,
44
+ "r":0.9489051095,
45
+ "f":0.950987564
46
  },
47
  "VerbForm":{
48
+ "p":0.9853372434,
49
+ "r":0.9806639912,
50
+ "f":0.9829950631
51
  },
52
  "Voice":{
53
+ "p":0.9461143695,
54
+ "r":0.9419708029,
55
+ "f":0.9440380395
56
  },
57
  "PronType":{
58
+ "p":0.9818426362,
59
+ "r":0.9765886288,
60
+ "f":0.9792085848
61
  },
62
  "Degree":{
63
+ "p":0.8759894459,
64
+ "r":0.8691099476,
65
+ "f":0.8725361367
66
  },
67
  "Definite":{
68
+ "p":0.9894736842,
69
+ "r":0.9949860724,
70
+ "f":0.9922222222
71
  },
72
  "Reflex":{
73
  "p":1.0,
74
+ "r":0.9565217391,
75
+ "f":0.9777777778
76
  },
77
  "Polarity":{
78
+ "p":0.99543379,
79
+ "r":0.9864253394,
80
+ "f":0.9909090909
81
  },
82
  "Poss":{
83
+ "p":0.8571428571,
84
+ "r":0.4615384615,
85
+ "f":0.6
86
  }
87
  },
88
+ "tag_acc":0.9727354664,
89
+ "sents_p":0.5894538606,
90
+ "sents_r":0.5978987584,
91
+ "sents_f":0.5936462779,
92
+ "dep_uas":0.7927745231,
93
+ "dep_las":0.7434279706,
94
  "dep_las_per_type":{
95
  "iobj":{
96
+ "p":0.7110609481,
97
  "r":0.7208237986,
98
+ "f":0.7159090909
99
  },
100
  "root":{
101
+ "p":0.7711864407,
102
+ "r":0.782234957,
103
+ "f":0.7766714083
104
  },
105
  "nsubj":{
106
+ "p":0.7379553467,
107
+ "r":0.7040358744,
108
+ "f":0.7205966724
109
  },
110
  "advmod":{
111
+ "p":0.6937321937,
112
+ "r":0.6763888889,
113
+ "f":0.6849507736
114
  },
115
  "advcl":{
116
+ "p":0.6299212598,
117
+ "r":0.6633499171,
118
+ "f":0.6462035541
119
  },
120
  "ccomp":{
121
+ "p":0.5982905983,
122
+ "r":0.4320987654,
123
+ "f":0.5017921147
124
  },
125
  "discourse":{
126
+ "p":0.7997237569,
127
+ "r":0.7964236589,
128
+ "f":0.7980702963
129
  },
130
  "obj":{
131
+ "p":0.7411167513,
132
+ "r":0.8048511577,
133
+ "f":0.7716701903
134
  },
135
  "det":{
136
+ "p":0.921387791,
137
+ "r":0.9205792014,
138
+ "f":0.9209833187
139
  },
140
  "nmod":{
141
+ "p":0.7365145228,
142
+ "r":0.6853281853,
143
+ "f":0.71
144
  },
145
  "cop":{
146
+ "p":0.7175925926,
147
+ "r":0.7311320755,
148
+ "f":0.7242990654
149
  },
150
  "appos":{
151
+ "p":0.4415584416,
152
+ "r":0.2073170732,
153
+ "f":0.2821576763
154
  },
155
  "case":{
156
+ "p":0.9569648924,
157
+ "r":0.9613196815,
158
+ "f":0.9591373439
159
  },
160
  "acl":{
161
+ "p":0.4692307692,
162
+ "r":0.3719512195,
163
+ "f":0.4149659864
164
  },
165
  "mark":{
166
+ "p":0.8755760369,
167
+ "r":0.8796296296,
168
+ "f":0.8775981524
169
  },
170
  "obl":{
171
+ "p":0.6899509804,
172
+ "r":0.7072864322,
173
+ "f":0.6985111663
174
  },
175
  "nsubj:pass":{
176
+ "p":0.5888888889,
177
+ "r":0.5578947368,
178
+ "f":0.572972973
179
  },
180
  "xcomp":{
181
+ "p":0.5407725322,
182
+ "r":0.525,
183
+ "f":0.532769556
184
  },
185
  "cc":{
186
+ "p":0.6444885799,
187
+ "r":0.6425742574,
188
+ "f":0.643529995
189
  },
190
  "conj":{
191
+ "p":0.5714285714,
192
+ "r":0.5974025974,
193
+ "f":0.5841269841
194
  },
195
  "dislocated":{
196
+ "p":0.25,
197
+ "r":0.0714285714,
198
+ "f":0.1111111111
199
  },
200
  "amod":{
201
+ "p":0.6666666667,
202
+ "r":0.7037037037,
203
+ "f":0.6846846847
204
  },
205
  "parataxis":{
206
  "p":0.0,
 
213
  "f":0.0
214
  },
215
  "nummod":{
216
+ "p":0.8571428571,
217
+ "r":0.8571428571,
218
+ "f":0.8571428571
219
  },
220
  "fixed":{
221
+ "p":0.6,
222
+ "r":0.75,
223
+ "f":0.6666666667
224
  },
225
  "csubj:pass":{
226
+ "p":0.0,
227
+ "r":0.0,
228
+ "f":0.0
229
  },
230
  "obl:agent":{
231
+ "p":0.6111111111,
232
+ "r":0.5,
233
+ "f":0.55
234
  },
235
  "orphan":{
236
+ "p":0.25,
237
+ "r":0.1714285714,
238
+ "f":0.2033898305
239
  },
240
  "vocative":{
241
+ "p":0.7169811321,
242
  "r":0.6229508197,
243
+ "f":0.6666666667
244
+ },
245
+ "flat:name":{
246
+ "p":0.8571428571,
247
+ "r":0.8571428571,
248
+ "f":0.8571428571
249
  },
250
  "aux":{
251
  "p":0.0,
 
256
  "p":0.0,
257
  "r":0.0,
258
  "f":0.0
 
 
 
 
 
259
  }
260
  },
261
+ "lemma_acc":0.9730359021,
262
+ "speed":5439.8496899715
263
  }
attribute_ruler/patterns CHANGED
Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ
 
config.cfg CHANGED
@@ -52,6 +52,7 @@ subword_features = true
52
  [components.morphologizer]
53
  factory = "morphologizer"
54
  extend = false
 
55
  overwrite = true
56
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
57
 
@@ -88,6 +89,7 @@ upstream = "tok2vec"
88
 
89
  [components.tagger]
90
  factory = "tagger"
 
91
  neg_prefix = "!"
92
  overwrite = false
93
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
 
52
  [components.morphologizer]
53
  factory = "morphologizer"
54
  extend = false
55
+ label_smoothing = 0.0
56
  overwrite = true
57
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
58
 
 
89
 
90
  [components.tagger]
91
  factory = "tagger"
92
+ label_smoothing = 0.0
93
  neg_prefix = "!"
94
  overwrite = false
95
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
grc_proiel_lg-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f6d52ca36e56051ee6dedbf75068347011d027c2593ea9108d76aeb69033bf9
3
- size 279450617
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9234167488a72eb95faedd3bd7ca6a90beabfe4ec67fa1fa157d6516150bef7
3
+ size 279459562
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39e4bd7cc76a93e28df338b870437f588562b373304ed017c70e86372846d794
3
  size 24489602
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27789bec48a44e7f4651d87d904d92a159e4769a5cdb3d249ba949e92ebf22cd
3
  size 24489602
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"grc",
3
  "name":"proiel_lg",
4
- "version":"3.5.3",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
- "spacy_version":">=3.5.3,<3.6.0",
11
- "spacy_git_version":"512241e12",
12
  "vectors":{
13
  "width":300,
14
  "vectors":200000,
@@ -1132,73 +1132,73 @@
1132
 
1133
  ],
1134
  "performance":{
1135
- "pos_acc":0.9726047466,
1136
- "morph_acc":0.9088045708,
1137
  "morph_per_feat":{
1138
  "Case":{
1139
- "p":0.9753507774,
1140
- "r":0.973750631,
1141
- "f":0.9745500474
1142
  },
1143
  "Gender":{
1144
- "p":0.9225486456,
1145
- "r":0.9256092893,
1146
- "f":0.9240764331
1147
  },
1148
  "Number":{
1149
- "p":0.9908836631,
1150
- "r":0.9890393961,
1151
- "f":0.9899606707
1152
  },
1153
  "Person":{
1154
- "p":0.9730029586,
1155
- "r":0.9712070875,
1156
- "f":0.9721041936
1157
  },
1158
  "PronType":{
1159
- "p":0.9859293194,
1160
- "r":0.9782467532,
1161
- "f":0.9820730117
1162
  },
1163
  "Polarity":{
1164
  "p":1.0,
1165
- "r":0.9844559585,
1166
- "f":0.9921671018
1167
  },
1168
  "Aspect":{
1169
- "p":0.9670710572,
1170
  "r":0.9500567537,
1171
- "f":0.9584884054
1172
  },
1173
  "Mood":{
1174
- "p":0.9747416762,
1175
- "r":0.9719519176,
1176
- "f":0.9733447979
1177
  },
1178
  "Tense":{
1179
- "p":0.9620034542,
1180
- "r":0.9567159052,
1181
- "f":0.9593523941
1182
  },
1183
  "VerbForm":{
1184
- "p":0.9906735751,
1185
- "r":0.9845520082,
1186
- "f":0.9876033058
1187
  },
1188
  "Voice":{
1189
- "p":0.9537132988,
1190
- "r":0.9484713157,
1191
- "f":0.9510850844
1192
  },
1193
  "Degree":{
1194
- "p":0.9129834254,
1195
- "r":0.8884408602,
1196
- "f":0.9005449591
1197
  },
1198
  "Definite":{
1199
- "p":0.9919441461,
1200
- "r":0.9978390059,
1201
- "f":0.9948828441
1202
  },
1203
  "Reflex":{
1204
  "p":1.0,
@@ -1207,188 +1207,188 @@
1207
  },
1208
  "Poss":{
1209
  "p":1.0,
1210
- "r":0.7368421053,
1211
- "f":0.8484848485
1212
  }
1213
  },
1214
- "tag_acc":0.9750219748,
1215
- "dep_uas":0.8111631995,
1216
- "dep_las":0.7622326399,
1217
  "dep_las_per_type":{
1218
  "nsubj":{
1219
- "p":0.7627659574,
1220
- "r":0.7768147346,
1221
- "f":0.769726248
1222
  },
1223
  "discourse":{
1224
- "p":0.8019125683,
1225
- "r":0.8063186813,
1226
- "f":0.804109589
1227
  },
1228
  "mark":{
1229
- "p":0.8448979592,
1230
- "r":0.8346774194,
1231
- "f":0.8397565923
1232
  },
1233
  "advmod":{
1234
- "p":0.7207207207,
1235
- "r":0.7132243685,
1236
- "f":0.71695295
1237
  },
1238
  "advcl":{
1239
- "p":0.6761133603,
1240
- "r":0.6844262295,
1241
- "f":0.6802443992
1242
  },
1243
  "xcomp":{
1244
- "p":0.6180904523,
1245
- "r":0.492,
1246
- "f":0.5478841871
1247
  },
1248
  "cop":{
1249
- "p":0.7466063348,
1250
- "r":0.7710280374,
1251
- "f":0.7586206897
1252
  },
1253
  "root":{
1254
- "p":0.8030888031,
1255
- "r":0.8164867517,
1256
- "f":0.8097323601
1257
  },
1258
  "det":{
1259
- "p":0.9293501962,
1260
- "r":0.9241110147,
1261
- "f":0.9267232007
1262
  },
1263
  "nmod":{
1264
- "p":0.731316726,
1265
- "r":0.7235915493,
1266
- "f":0.7274336283
1267
  },
1268
  "obj":{
1269
- "p":0.7871720117,
1270
- "r":0.8411214953,
1271
- "f":0.813253012
1272
  },
1273
  "case":{
1274
- "p":0.9564744287,
1275
- "r":0.9638157895,
1276
- "f":0.9601310759
1277
  },
1278
  "obl":{
1279
- "p":0.6971098266,
1280
  "r":0.7362637363,
1281
- "f":0.716152019
1282
  },
1283
  "cc":{
1284
- "p":0.6632337796,
1285
- "r":0.6625514403,
1286
- "f":0.6628924344
1287
  },
1288
  "conj":{
1289
- "p":0.6045576408,
1290
- "r":0.5918635171,
1291
- "f":0.5981432361
1292
  },
1293
  "obl:agent":{
1294
- "p":0.9166666667,
1295
- "r":0.2972972973,
1296
- "f":0.4489795918
1297
  },
1298
  "ccomp":{
1299
- "p":0.5187165775,
1300
- "r":0.4825870647,
1301
- "f":0.5
1302
  },
1303
  "nsubj:pass":{
1304
- "p":0.6904761905,
1305
- "r":0.5420560748,
1306
- "f":0.6073298429
1307
  },
1308
  "amod":{
1309
- "p":0.6901408451,
1310
- "r":0.6901408451,
1311
- "f":0.6901408451
1312
  },
1313
  "acl":{
1314
- "p":0.4444444444,
1315
- "r":0.4363636364,
1316
- "f":0.4403669725
1317
  },
1318
  "iobj":{
1319
- "p":0.7162471396,
1320
- "r":0.7228637413,
1321
- "f":0.7195402299
1322
  },
1323
- "appos":{
1324
- "p":0.4074074074,
1325
- "r":0.3120567376,
1326
- "f":0.3534136546
1327
  },
1328
  "nummod":{
1329
- "p":0.8644067797,
1330
- "r":0.75,
1331
- "f":0.8031496063
1332
  },
1333
  "vocative":{
1334
- "p":0.7118644068,
1335
- "r":0.6086956522,
1336
- "f":0.65625
1337
  },
1338
  "orphan":{
1339
- "p":0.1428571429,
1340
  "r":0.0930232558,
1341
- "f":0.1126760563
1342
  },
1343
- "dep":{
1344
- "p":0.0,
1345
- "r":0.0,
1346
- "f":0.0
1347
  },
1348
  "parataxis":{
1349
- "p":0.1666666667,
1350
- "r":0.1,
1351
- "f":0.125
 
 
 
 
 
1352
  },
1353
  "dislocated":{
1354
- "p":0.5555555556,
1355
- "r":0.1923076923,
1356
- "f":0.2857142857
1357
  },
1358
  "csubj:pass":{
1359
- "p":0.25,
1360
- "r":0.2,
1361
- "f":0.2222222222
1362
  },
1363
- "flat:name":{
1364
- "p":0.9285714286,
1365
- "r":0.5909090909,
1366
- "f":0.7222222222
1367
  },
1368
  "aux:pass":{
1369
  "p":0.0,
1370
  "r":0.0,
1371
  "f":0.0
1372
  },
1373
- "fixed":{
1374
- "p":0.8333333333,
1375
- "r":0.5,
1376
- "f":0.625
1377
- },
1378
  "aux":{
1379
  "p":0.0,
1380
  "r":0.0,
1381
  "f":0.0
1382
  }
1383
  },
1384
- "sents_p":0.6061776062,
1385
- "sents_r":0.6162904809,
1386
- "sents_f":0.6111922141,
1387
- "lemma_acc":0.9732639906,
1388
- "tok2vec_loss":73002.5595581873,
1389
- "morphologizer_loss":779.3010618389,
1390
- "tagger_loss":218.2356933637,
1391
- "parser_loss":17925.5136122362
1392
  },
1393
  "requirements":[
1394
 
 
1
  {
2
  "lang":"grc",
3
  "name":"proiel_lg",
4
+ "version":"3.6.0",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
+ "spacy_version":">=3.6.0,<3.7.0",
11
+ "spacy_git_version":"6fc153a26",
12
  "vectors":{
13
  "width":300,
14
  "vectors":200000,
 
1132
 
1133
  ],
1134
  "performance":{
1135
+ "pos_acc":0.97333724,
1136
+ "morph_acc":0.9031643715,
1137
  "morph_per_feat":{
1138
  "Case":{
1139
+ "p":0.9714430124,
1140
+ "r":0.9702170621,
1141
+ "f":0.9708296502
1142
  },
1143
  "Gender":{
1144
+ "p":0.9143509707,
1145
+ "r":0.9194844966,
1146
+ "f":0.9169105484
1147
  },
1148
  "Number":{
1149
+ "p":0.991193535,
1150
+ "r":0.9892462,
1151
+ "f":0.9902189101
1152
  },
1153
  "Person":{
1154
+ "p":0.9777448071,
1155
+ "r":0.973052787,
1156
+ "f":0.9753931545
1157
  },
1158
  "PronType":{
1159
+ "p":0.986932375,
1160
+ "r":0.9808441558,
1161
+ "f":0.9838788471
1162
  },
1163
  "Polarity":{
1164
  "p":1.0,
1165
+ "r":0.9792746114,
1166
+ "f":0.9895287958
1167
  },
1168
  "Aspect":{
1169
+ "p":0.9698725377,
1170
  "r":0.9500567537,
1171
+ "f":0.9598623853
1172
  },
1173
  "Mood":{
1174
+ "p":0.9718066743,
1175
+ "r":0.966800229,
1176
+ "f":0.9692969871
1177
  },
1178
  "Tense":{
1179
+ "p":0.9599585778,
1180
+ "r":0.9553418069,
1181
+ "f":0.9576446281
1182
  },
1183
  "VerbForm":{
1184
+ "p":0.9892992751,
1185
+ "r":0.9838654308,
1186
+ "f":0.9865748709
1187
  },
1188
  "Voice":{
1189
+ "p":0.9558163618,
1190
+ "r":0.9512195122,
1191
+ "f":0.9535123967
1192
  },
1193
  "Degree":{
1194
+ "p":0.901504788,
1195
+ "r":0.8857526882,
1196
+ "f":0.893559322
1197
  },
1198
  "Definite":{
1199
+ "p":0.9919527897,
1200
+ "r":0.998919503,
1201
+ "f":0.9954239569
1202
  },
1203
  "Reflex":{
1204
  "p":1.0,
 
1207
  },
1208
  "Poss":{
1209
  "p":1.0,
1210
+ "r":0.7894736842,
1211
+ "f":0.8823529412
1212
  }
1213
  },
1214
+ "tag_acc":0.9753149722,
1215
+ "dep_uas":0.8039115148,
1216
+ "dep_las":0.75666569,
1217
  "dep_las_per_type":{
1218
  "nsubj":{
1219
+ "p":0.7616875713,
1220
+ "r":0.7237269772,
1221
+ "f":0.7422222222
1222
  },
1223
  "discourse":{
1224
+ "p":0.806362379,
1225
+ "r":0.8008241758,
1226
+ "f":0.8035837354
1227
  },
1228
  "mark":{
1229
+ "p":0.8155737705,
1230
+ "r":0.8024193548,
1231
+ "f":0.8089430894
1232
  },
1233
  "advmod":{
1234
+ "p":0.7274074074,
1235
+ "r":0.7295690936,
1236
+ "f":0.7284866469
1237
  },
1238
  "advcl":{
1239
+ "p":0.6850393701,
1240
+ "r":0.7131147541,
1241
+ "f":0.6987951807
1242
  },
1243
  "xcomp":{
1244
+ "p":0.5513307985,
1245
+ "r":0.58,
1246
+ "f":0.5653021442
1247
  },
1248
  "cop":{
1249
+ "p":0.7336448598,
1250
+ "r":0.7336448598,
1251
+ "f":0.7336448598
1252
  },
1253
  "root":{
1254
+ "p":0.7939221273,
1255
+ "r":0.8204121688,
1256
+ "f":0.8069498069
1257
  },
1258
  "det":{
1259
+ "p":0.9313640313,
1260
+ "r":0.9297484822,
1261
+ "f":0.9305555556
1262
  },
1263
  "nmod":{
1264
+ "p":0.7538461538,
1265
+ "r":0.6901408451,
1266
+ "f":0.7205882353
1267
  },
1268
  "obj":{
1269
+ "p":0.7806580259,
1270
+ "r":0.8130841121,
1271
+ "f":0.7965412004
1272
  },
1273
  "case":{
1274
+ "p":0.9588299025,
1275
+ "r":0.9703947368,
1276
+ "f":0.9645776567
1277
  },
1278
  "obl":{
1279
+ "p":0.6963048499,
1280
  "r":0.7362637363,
1281
+ "f":0.715727003
1282
  },
1283
  "cc":{
1284
+ "p":0.6373966942,
1285
+ "r":0.6347736626,
1286
+ "f":0.6360824742
1287
  },
1288
  "conj":{
1289
+ "p":0.562099872,
1290
+ "r":0.5761154856,
1291
+ "f":0.5690213869
1292
  },
1293
  "obl:agent":{
1294
+ "p":1.0,
1295
+ "r":0.4864864865,
1296
+ "f":0.6545454545
1297
  },
1298
  "ccomp":{
1299
+ "p":0.5673758865,
1300
+ "r":0.3980099502,
1301
+ "f":0.4678362573
1302
  },
1303
  "nsubj:pass":{
1304
+ "p":0.6534653465,
1305
+ "r":0.6168224299,
1306
+ "f":0.6346153846
1307
  },
1308
  "amod":{
1309
+ "p":0.6592920354,
1310
+ "r":0.6995305164,
1311
+ "f":0.6788154897
1312
  },
1313
  "acl":{
1314
+ "p":0.4846153846,
1315
+ "r":0.3818181818,
1316
+ "f":0.4271186441
1317
  },
1318
  "iobj":{
1319
+ "p":0.7181208054,
1320
+ "r":0.7413394919,
1321
+ "f":0.7295454545
1322
  },
1323
+ "dep":{
1324
+ "p":0.0,
1325
+ "r":0.0,
1326
+ "f":0.0
1327
  },
1328
  "nummod":{
1329
+ "p":0.8983050847,
1330
+ "r":0.7794117647,
1331
+ "f":0.8346456693
1332
  },
1333
  "vocative":{
1334
+ "p":0.7704918033,
1335
+ "r":0.6811594203,
1336
+ "f":0.7230769231
1337
  },
1338
  "orphan":{
1339
+ "p":0.2352941176,
1340
  "r":0.0930232558,
1341
+ "f":0.1333333333
1342
  },
1343
+ "appos":{
1344
+ "p":0.3425925926,
1345
+ "r":0.2624113475,
1346
+ "f":0.297188755
1347
  },
1348
  "parataxis":{
1349
+ "p":0.1,
1350
+ "r":0.05,
1351
+ "f":0.0666666667
1352
+ },
1353
+ "flat:name":{
1354
+ "p":0.8125,
1355
+ "r":0.5909090909,
1356
+ "f":0.6842105263
1357
  },
1358
  "dislocated":{
1359
+ "p":0.5,
1360
+ "r":0.3076923077,
1361
+ "f":0.380952381
1362
  },
1363
  "csubj:pass":{
1364
+ "p":0.0,
1365
+ "r":0.0,
1366
+ "f":0.0
1367
  },
1368
+ "fixed":{
1369
+ "p":0.6666666667,
1370
+ "r":0.6,
1371
+ "f":0.6315789474
1372
  },
1373
  "aux:pass":{
1374
  "p":0.0,
1375
  "r":0.0,
1376
  "f":0.0
1377
  },
 
 
 
 
 
1378
  "aux":{
1379
  "p":0.0,
1380
  "r":0.0,
1381
  "f":0.0
1382
  }
1383
  },
1384
+ "sents_p":0.5935422602,
1385
+ "sents_r":0.6133464181,
1386
+ "sents_f":0.6032818533,
1387
+ "lemma_acc":0.9745092294,
1388
+ "tok2vec_loss":74655.8410613122,
1389
+ "morphologizer_loss":2118.7215433121,
1390
+ "tagger_loss":480.3859246671,
1391
+ "parser_loss":27517.6268136028
1392
  },
1393
  "requirements":[
1394
 
morphologizer/cfg CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "extend":false,
 
3
  "labels_morph":{
4
  "Case=Gen|Gender=Masc|Number=Sing|POS=PROPN":"Case=Gen|Gender=Masc|Number=Sing",
5
  "Case=Gen|Gender=Masc|Number=Sing|POS=NOUN":"Case=Gen|Gender=Masc|Number=Sing",
 
1
  {
2
  "extend":false,
3
+ "label_smoothing":0.0,
4
  "labels_morph":{
5
  "Case=Gen|Gender=Masc|Number=Sing|POS=PROPN":"Case=Gen|Gender=Masc|Number=Sing",
6
  "Case=Gen|Gender=Masc|Number=Sing|POS=NOUN":"Case=Gen|Gender=Masc|Number=Sing",
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e8d56f2fd0e91993c9950c7db2020a989445e6e3fe6696b22066aed68711527
3
  size 1058262
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c0f9a004933d19457d0226782b226e658bb5644c50c8d7138f5c966599a51e
3
  size 1058262
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de71e831cfc42e7cf212530b32489a38fa6a56e791c0102fcfd7dd086b535279
3
  size 1782009
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb1b9433bbeb024f29ff77f14ba38faaa18905f61f5a34657a00821762d965cb
3
  size 1782009
tagger/cfg CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "labels":[
3
  "A-",
4
  "C-",
 
1
  {
2
+ "label_smoothing":0.0,
3
  "labels":[
4
  "A-",
5
  "C-",
tagger/model CHANGED
Binary files a/tagger/model and b/tagger/model differ
 
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6ebd7dcc4d53847a71bf3c39cb7ae9bb8fd984132dbe83cd0510aec777b735e
3
  size 35970008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc7e53d3c14d9d149273e812073c2ad86a40f9f616637cca1a3b7c00c0a62cdd
3
  size 35970008
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e11087e9bbbfcc4871885e5930e003630da432f3a604f83a687b9f53efe5869a
3
- size 17727257
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96d2990c91aa1e0a5cc77bee8ba8fa45c5534c3eb2697a6dbde30cc6fb44238e
3
+ size 17718106
vocab/vectors.cfg CHANGED
@@ -5,5 +5,6 @@
5
  "hash_count":2,
6
  "hash_seed":2166136261,
7
  "bow":"<",
8
- "eow":">"
 
9
  }
 
5
  "hash_count":2,
6
  "hash_seed":2166136261,
7
  "bow":"<",
8
+ "eow":">",
9
+ "attr":65
10
  }