Update spaCy pipeline

Browse files

Files changed (10) hide show

README.md +9 -9
attribute_ruler/patterns +0 -0
config.cfg +0 -2
en_skillner-any-py3-none-any.whl +2 -2
meta.json +33 -33
ner/model +2 -2
ner/moves +1 -1
tagger/cfg +0 -1
vocab/lookups.bin +2 -2
vocab/strings.json +0 -0

README.md CHANGED Viewed

@@ -14,25 +14,25 @@ model-index:
     metrics:
     - name: NER Precision
       type: precision
-      value: 0.4605714286
     - name: NER Recall
       type: recall
-      value: 0.4574347333
     - name: NER F Score
       type: f_score
-      value: 0.4589977221
 ---
 A Named Entity Recognition (NER) model to extract SKILL, EXPERIENCE and BENEFIT from job adverts.
 | Feature | Description |
 | --- | --- |
 | **Name** | `en_skillner` |
-| **Version** | `3.7.1` |
-| **spaCy** | `>=3.7.4,<3.8.0` |
 | **Default Pipeline** | `tok2vec`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
 | **Components** | `tok2vec`, `tagger`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
 | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
-| **Sources** | [OntoNotes 5](https://catalog.ldc.upenn.edu/LDC2013T19) (Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston)<br>[ClearNLP Constituent-to-Dependency Conversion](https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md) (Emory University)<br>[WordNet 3.0](https://wordnet.princeton.edu/) (Princeton University)<br>[Explosion Vectors (OSCAR 2109 + Wikipedia + OpenSubtitles + WMT News Crawl)](https://github.com/explosion/spacy-vectors-builder) (Explosion) |
 | **License** | `MIT` |
 | **Author** | [nestauk](https://explosion.ai) |
@@ -52,6 +52,6 @@ A Named Entity Recognition (NER) model to extract SKILL, EXPERIENCE and BENEFIT
 | Type | Score |
 | --- | --- |
-| `ENTS_P` | 46.06 |
-| `ENTS_R` | 45.74 |
-| `ENTS_F` | 45.90 |

     metrics:
     - name: NER Precision
       type: precision
+      value: 0.5991309071
     - name: NER Recall
       type: recall
+      value: 0.5768828452
     - name: NER F Score
       type: f_score
+      value: 0.5877964295
 ---
 A Named Entity Recognition (NER) model to extract SKILL, EXPERIENCE and BENEFIT from job adverts.
 | Feature | Description |
 | --- | --- |
 | **Name** | `en_skillner` |
+| **Version** | `3.5.0` |
+| **spaCy** | `>=3.5.3,<3.6.0` |
 | **Default Pipeline** | `tok2vec`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
 | **Components** | `tok2vec`, `tagger`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
 | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
+| **Sources** | [OntoNotes 5](https://catalog.ldc.upenn.edu/LDC2013T19) (Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston)<br />[ClearNLP Constituent-to-Dependency Conversion](https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md) (Emory University)<br />[WordNet 3.0](https://wordnet.princeton.edu/) (Princeton University)<br />[Explosion Vectors (OSCAR 2109 + Wikipedia + OpenSubtitles + WMT News Crawl)](https://github.com/explosion/spacy-vectors-builder) (Explosion) |
 | **License** | `MIT` |
 | **Author** | [nestauk](https://explosion.ai) |
 | Type | Score |
 | --- | --- |
+| `ENTS_P` | 59.91 |
+| `ENTS_R` | 57.69 |
+| `ENTS_F` | 58.78 |

attribute_ruler/patterns CHANGED Viewed

Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ

config.cfg CHANGED Viewed

@@ -17,7 +17,6 @@ after_creation = null
 after_pipeline_creation = null
 batch_size = 256
 tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
-vectors = {"@vectors":"spacy.Vectors.v1"}
 [components]
@@ -117,7 +116,6 @@ maxout_pieces = 2
 [components.tagger]
 factory = "tagger"
-label_smoothing = 0.0
 neg_prefix = "!"
 overwrite = false
 scorer = {"@scorers":"spacy.tagger_scorer.v1"}

 after_pipeline_creation = null
 batch_size = 256
 tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
 [components]
 [components.tagger]
 factory = "tagger"
 neg_prefix = "!"
 overwrite = false
 scorer = {"@scorers":"spacy.tagger_scorer.v1"}

en_skillner-any-py3-none-any.whl CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6d6401718f0b7e4271c63c65f625a931ecadad6916c30ebfaf4a954f3c645912
-size 587702666

 version https://git-lfs.github.com/spec/v1
+oid sha256:86b2de6b625e84c55050bccdba70da7d4dc1d39f272bb9debba1b74b0857c868
+size 587688649

meta.json CHANGED Viewed

@@ -1,14 +1,14 @@
 {
   "lang":"en",
   "name":"skillner",
-  "version":"3.7.1",
   "description":"A Named Entity Recognition (NER) model to extract SKILL, EXPERIENCE and BENEFIT from job adverts.",
   "author":"nestauk",
   "email":"[email protected]",
   "url":"https://explosion.ai",
   "license":"MIT",
-  "spacy_version":">=3.7.4,<3.8.0",
-  "spacy_git_version":"bd2c17e20",
   "vectors":{
     "width":300,
     "vectors":514157,
@@ -43,45 +43,45 @@
     "senter"
   ],
   "performance":{
-    "ents_p":0.4605714286,
-    "ents_r":0.4574347333,
-    "ents_f":0.4589977221,
     "ents_per_type":{
       "SKILL":{
-        "correct":461,
-        "incorrect":8,
         "partial":0,
-        "missed":304,
-        "spurious":340,
-        "possible":773,
-        "actual":809,
-        "precision":0.5698393078,
-        "recall":0.596377749,
-        "f1":0.582806574
       },
       "EXPERIENCE":{
-        "correct":33,
-        "incorrect":16,
         "partial":0,
-        "missed":59,
-        "spurious":17,
-        "possible":108,
-        "actual":66,
-        "precision":0.5,
-        "recall":0.3055555556,
-        "f1":0.3793103448
       },
       "BENEFIT":{
-        "correct":0,
-        "incorrect":0,
         "partial":0,
-        "missed":0,
-        "spurious":0,
-        "possible":0,
-        "actual":0,
-        "precision":0,
-        "recall":0,
-        "f1":0
       }
     }
   },

 {
   "lang":"en",
   "name":"skillner",
+  "version":"3.5.0",
   "description":"A Named Entity Recognition (NER) model to extract SKILL, EXPERIENCE and BENEFIT from job adverts.",
   "author":"nestauk",
   "email":"[email protected]",
   "url":"https://explosion.ai",
   "license":"MIT",
+  "spacy_version":">=3.5.3,<3.6.0",
+  "spacy_git_version":"9e0322de1",
   "vectors":{
     "width":300,
     "vectors":514157,
     "senter"
   ],
   "performance":{
+    "ents_p":0.5991309071,
+    "ents_r":0.5768828452,
+    "ents_f":0.5877964295,
     "ents_per_type":{
       "SKILL":{
+        "correct":1208,
+        "incorrect":32,
         "partial":0,
+        "missed":429,
+        "spurious":420,
+        "possible":1669,
+        "actual":1660,
+        "precision":0.7277108434,
+        "recall":0.7237866986,
+        "f1":0.7257434665
       },
       "EXPERIENCE":{
+        "correct":84,
+        "incorrect":37,
         "partial":0,
+        "missed":55,
+        "spurious":29,
+        "possible":176,
+        "actual":150,
+        "precision":0.56,
+        "recall":0.4772727273,
+        "f1":0.5153374233
       },
       "BENEFIT":{
+        "correct":24,
+        "incorrect":3,
         "partial":0,
+        "missed":40,
+        "spurious":4,
+        "possible":67,
+        "actual":31,
+        "precision":0.7741935484,
+        "recall":0.3582089552,
+        "f1":0.4897959184
       }
     }
   },

ner/model CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:00f3751c9e8131d61d924c752bc58f62e329d56e34612a544a8cea766b0bc6e5
-size 6383023

 version https://git-lfs.github.com/spec/v1
+oid sha256:5dd953e4cc7eeaa1052539fcb71b312a0650910a310fb84b5eac2d89e993e8c0
+size 6384063

ner/moves CHANGED Viewed

@@ -1 +1 @@

- ��moves�|{"0":{},"1":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"~~SKILL~~":-1,"~~EXPERIENCE~~":-2},"2":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"~~SKILL~~":-1,"~~EXPERIENCE~~":-2},"3":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"~~SKILL~~":-1,"~~EXPERIENCE~~":-2},"4":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"":1,"~~SKILL~~":-1,"~~EXPERIENCE~~":-2},"5":{"":1}}�cfg��neg_key�

+ ��moves��{"0":{},"1":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"EXPERIENCE":-1,"SKILL":-2,"BENEFIT":-3},"2":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"EXPERIENCE":-1,"SKILL":-2,"BENEFIT":-3},"3":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"EXPERIENCE":-1,"SKILL":-2,"BENEFIT":-3},"4":{"ORG":56516,"DATE":40493,"PERSON":36534,"GPE":26745,"MONEY":15158,"CARDINAL":14109,"NORP":9641,"PERCENT":9199,"WORK_OF_ART":4488,"LOC":4055,"TIME":3678,"QUANTITY":3123,"FAC":3046,"EVENT":3021,"ORDINAL":2142,"PRODUCT":1787,"LAW":1624,"LANGUAGE":355,"":1,"EXPERIENCE":-1,"SKILL":-2,"BENEFIT":-3},"5":{"":1}}�cfg��neg_key�

tagger/cfg CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "label_smoothing":0.0,
   "labels":[
     "$",
     "''",

 {
   "labels":[
     "$",
     "''",

vocab/lookups.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fce9c883c56165f29573cc938c2a1c9d417ac61bd8f56b671dd5f7996de70682
-size 70040

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ddd140ecac6a8c4592e9146d6e30074569ffaed97ee51edc9587dc510f8934c
+size 69982

vocab/strings.json CHANGED Viewed

The diff for this file is too large to render. See raw diff