adrianeboyd committed on
Commit
599be47
1 Parent(s): 09d11c9

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -48,7 +48,7 @@ model-index:
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.9645886243
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
@@ -78,8 +78,8 @@ Spanish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `es_core_news_md` |
81
- | **Version** | `3.6.0` |
82
- | **spaCy** | `>=3.6.0,<3.7.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
85
  | **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
@@ -120,7 +120,7 @@ Spanish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
120
  | `DEP_UAS` | 91.26 |
121
  | `DEP_LAS` | 88.00 |
122
  | `TAG_ACC` | 96.11 |
123
- | `LEMMA_ACC` | 96.46 |
124
  | `ENTS_P` | 89.25 |
125
  | `ENTS_R` | 89.51 |
126
  | `ENTS_F` | 89.38 |
 
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.964971968
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `es_core_news_md` |
81
+ | **Version** | `3.7.0` |
82
+ | **spaCy** | `>=3.7.0,<3.8.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
85
  | **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
 
120
  | `DEP_UAS` | 91.26 |
121
  | `DEP_LAS` | 88.00 |
122
  | `TAG_ACC` | 96.11 |
123
+ | `LEMMA_ACC` | 96.50 |
124
  | `ENTS_P` | 89.25 |
125
  | `ENTS_R` | 89.51 |
126
  | `ENTS_F` | 89.38 |
accuracy.json CHANGED
@@ -293,7 +293,7 @@
293
  }
294
  },
295
  "tag_acc": 0.9610850187,
296
- "lemma_acc": 0.9645886243,
297
  "ents_p": 0.8925237438,
298
  "ents_r": 0.8951031872,
299
  "ents_f": 0.8938116045,
@@ -319,5 +319,5 @@
319
  "f": 0.8288097756
320
  }
321
  },
322
- "speed": 10142.7772589352
323
  }
 
293
  }
294
  },
295
  "tag_acc": 0.9610850187,
296
+ "lemma_acc": 0.964971968,
297
  "ents_p": 0.8925237438,
298
  "ents_r": 0.8951031872,
299
  "ents_f": 0.8938116045,
 
319
  "f": 0.8288097756
320
  }
321
  },
322
+ "speed": 8100.6553926426
323
  }
config.cfg CHANGED
@@ -17,6 +17,7 @@ after_creation = null
17
  after_pipeline_creation = null
18
  batch_size = 256
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
 
20
 
21
  [components]
22
 
 
17
  after_pipeline_creation = null
18
  batch_size = 256
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+ vectors = {"@vectors":"spacy.Vectors.v1"}
21
 
22
  [components]
23
 
es_core_news_md-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3d69542decdde20097a10795bddb8dc841731cd2e00e3f490306c850c2f7cd4
3
- size 42285715
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6d6ebed875869a9759c8c096f2cef581fa32d861646030f771c83e5799de82
3
+ size 42285776
lemmatizer/lookups/lookups.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be833a634de5b55fa529aceee97fcc09a193e2017b5e4b34bafe103ad97600aa
3
- size 165037
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee3740fdad2ebc1cf79a63a8e5b2d2f3dd47b33c3a7a0bc9351ba5a1246b6a07
3
+ size 165225
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"es",
3
  "name":"core_news_md",
4
- "version":"3.6.0",
5
  "description":"Spanish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"GNU GPL 3.0",
10
- "spacy_version":">=3.6.0,<3.7.0",
11
- "spacy_git_version":"cb4fdc83e",
12
  "vectors":{
13
  "width":300,
14
  "vectors":20000,
@@ -815,7 +815,7 @@
815
  }
816
  },
817
  "tag_acc":0.9610850187,
818
- "lemma_acc":0.9645886243,
819
  "ents_p":0.8925237438,
820
  "ents_r":0.8951031872,
821
  "ents_f":0.8938116045,
@@ -841,7 +841,7 @@
841
  "f":0.8288097756
842
  }
843
  },
844
- "speed":10142.7772589352
845
  },
846
  "sources":[
847
  {
 
1
  {
2
  "lang":"es",
3
  "name":"core_news_md",
4
+ "version":"3.7.0",
5
  "description":"Spanish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"GNU GPL 3.0",
10
+ "spacy_version":">=3.7.0,<3.8.0",
11
+ "spacy_git_version":"6b4f77441",
12
  "vectors":{
13
  "width":300,
14
  "vectors":20000,
 
815
  }
816
  },
817
  "tag_acc":0.9610850187,
818
+ "lemma_acc":0.964971968,
819
  "ents_p":0.8925237438,
820
  "ents_r":0.8951031872,
821
  "ents_f":0.8938116045,
 
841
  "f":0.8288097756
842
  }
843
  },
844
+ "speed":8100.6553926426
845
  },
846
  "sources":[
847
  {