Commit
·
486ce79
1
Parent(s):
c7180d3
Update spaCy pipeline
Browse files
- README.md +2 -2
- accuracy.json +1 -1
- config.cfg +2 -0
- meta.json +4 -4
- morphologizer/cfg +1 -0
- nl_core_news_md-any-py3-none-any.whl +2 -2
- tagger/cfg +1 -0
README.md
CHANGED
@@ -78,8 +78,8 @@ Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, pa
|
|
78 |
| Feature | Description |
|
79 |
| --- | --- |
|
80 |
| **Name** | `nl_core_news_md` |
|
81 |
-
| **Version** | `3.
|
82 |
-
| **spaCy** | `>=3.
|
83 |
| **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
|
84 |
| **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
|
85 |
| **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
|
|
|
78 |
| Feature | Description |
|
79 |
| --- | --- |
|
80 |
| **Name** | `nl_core_news_md` |
|
81 |
+
| **Version** | `3.6.0` |
|
82 |
+
| **spaCy** | `>=3.6.0,<3.7.0` |
|
83 |
| **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
|
84 |
| **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
|
85 |
| **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
|
accuracy.json
CHANGED
@@ -277,7 +277,7 @@
|
|
277 |
"f": 0.0
|
278 |
}
|
279 |
},
|
280 |
-
"speed":
|
281 |
"token_acc": 0.999433329,
|
282 |
"token_p": 0.9974281853,
|
283 |
"token_r": 0.9975586363,
|
|
|
277 |
"f": 0.0
|
278 |
}
|
279 |
},
|
280 |
+
"speed": 11001.4289307816,
|
281 |
"token_acc": 0.999433329,
|
282 |
"token_p": 0.9974281853,
|
283 |
"token_r": 0.9975586363,
|
config.cfg
CHANGED
@@ -46,6 +46,7 @@ upstream = "tok2vec"
|
|
46 |
[components.morphologizer]
|
47 |
factory = "morphologizer"
|
48 |
extend = false
|
|
|
49 |
overwrite = true
|
50 |
scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
|
51 |
|
@@ -143,6 +144,7 @@ maxout_pieces = 2
|
|
143 |
|
144 |
[components.tagger]
|
145 |
factory = "tagger"
|
|
|
146 |
neg_prefix = "!"
|
147 |
overwrite = false
|
148 |
scorer = {"@scorers":"spacy.tagger_scorer.v1"}
|
|
|
46 |
[components.morphologizer]
|
47 |
factory = "morphologizer"
|
48 |
extend = false
|
49 |
+
label_smoothing = 0.0
|
50 |
overwrite = true
|
51 |
scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
|
52 |
|
|
|
144 |
|
145 |
[components.tagger]
|
146 |
factory = "tagger"
|
147 |
+
label_smoothing = 0.0
|
148 |
neg_prefix = "!"
|
149 |
overwrite = false
|
150 |
scorer = {"@scorers":"spacy.tagger_scorer.v1"}
|
meta.json
CHANGED
@@ -1,14 +1,14 @@
|
|
1 |
{
|
2 |
"lang":"nl",
|
3 |
"name":"core_news_md",
|
4 |
-
"version":"3.
|
5 |
"description":"Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
|
6 |
"author":"Explosion",
|
7 |
"email":"[email protected]",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 4.0",
|
10 |
-
"spacy_version":">=3.
|
11 |
-
"spacy_git_version":"
|
12 |
"vectors":{
|
13 |
"width":300,
|
14 |
"vectors":20000,
|
@@ -655,7 +655,7 @@
|
|
655 |
"f":0.0
|
656 |
}
|
657 |
},
|
658 |
-
"speed":
|
659 |
"token_acc":0.999433329,
|
660 |
"token_p":0.9974281853,
|
661 |
"token_r":0.9975586363,
|
|
|
1 |
{
|
2 |
"lang":"nl",
|
3 |
"name":"core_news_md",
|
4 |
+
"version":"3.6.0",
|
5 |
"description":"Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
|
6 |
"author":"Explosion",
|
7 |
"email":"[email protected]",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 4.0",
|
10 |
+
"spacy_version":">=3.6.0,<3.7.0",
|
11 |
+
"spacy_git_version":"cb4fdc83e",
|
12 |
"vectors":{
|
13 |
"width":300,
|
14 |
"vectors":20000,
|
|
|
655 |
"f":0.0
|
656 |
}
|
657 |
},
|
658 |
+
"speed":11001.4289307816,
|
659 |
"token_acc":0.999433329,
|
660 |
"token_p":0.9974281853,
|
661 |
"token_r":0.9975586363,
|
morphologizer/cfg
CHANGED
@@ -1,5 +1,6 @@
|
|
1 |
{
|
2 |
"extend":false,
|
|
|
3 |
"labels_morph":{
|
4 |
"POS=PRON|Person=3|PronType=Dem":"Person=3|PronType=Dem",
|
5 |
"Number=Sing|POS=AUX|Tense=Pres|VerbForm=Fin":"Number=Sing|Tense=Pres|VerbForm=Fin",
|
|
|
1 |
{
|
2 |
"extend":false,
|
3 |
+
"label_smoothing":0.0,
|
4 |
"labels_morph":{
|
5 |
"POS=PRON|Person=3|PronType=Dem":"Person=3|PronType=Dem",
|
6 |
"Number=Sing|POS=AUX|Tense=Pres|VerbForm=Fin":"Number=Sing|Tense=Pres|VerbForm=Fin",
|
nl_core_news_md-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e294737c628772a13b727b51bf8eb6b254ad546fb6faa2a03eaa8073763380b
|
3 |
+
size 42745425
|
tagger/cfg
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
{
|
|
|
2 |
"labels":[
|
3 |
"ADJ|nom|basis|met-e|mv-n",
|
4 |
"ADJ|nom|basis|met-e|zonder-n|bijz",
|
|
|
1 |
{
|
2 |
+
"label_smoothing":0.0,
|
3 |
"labels":[
|
4 |
"ADJ|nom|basis|met-e|mv-n",
|
5 |
"ADJ|nom|basis|met-e|zonder-n|bijz",
|