Adriane Boyd
committed on
Commit
•
c004b3f
1
Parent(s):
aaf8333
Update spaCy pipeline
Browse files
- README.md +8 -8
- accuracy.json +4 -4
- config.cfg +1 -6
- meta.json +9 -13
- senter/model +1 -1
- vocab/strings.json +2 -2
- xx_sent_ud_sm-any-py3-none-any.whl +2 -2
README.md
CHANGED
@@ -13,7 +13,7 @@ model-index:
|
|
13 |
metrics:
|
14 |
- name: Sentences F-Score
|
15 |
type: f_score
|
16 |
-
value: 0.
|
17 |
---
|
18 |
### Details: https://spacy.io/models/xx#xx_sent_ud_sm
|
19 |
|
@@ -22,10 +22,10 @@ Multi-language pipeline optimized for CPU. Components: senter.
|
|
22 |
| Feature | Description |
|
23 |
| --- | --- |
|
24 |
| **Name** | `xx_sent_ud_sm` |
|
25 |
-
| **Version** | `3.
|
26 |
-
| **spaCy** | `>=3.
|
27 |
-
| **Default Pipeline** | `senter
|
28 |
-
| **Components** | `senter
|
29 |
| **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
|
30 |
| **Sources** | [Universal Dependencies v2.8 (UD_Afrikaans-AfriBooms, UD_Croatian-SET, UD_Czech-CAC, UD_Czech-CLTT, UD_Danish-DDT, UD_Dutch-Alpino, UD_Dutch-LassySmall, UD_English-EWT, UD_Finnish-FTB, UD_Finnish-TDT, UD_French-GSD, UD_French-Spoken, UD_German-GSD, UD_Indonesian-GSD, UD_Irish-IDT, UD_Italian-TWITTIRO, UD_Korean-GSD, UD_Korean-Kaist, UD_Latvian-LVTB, UD_Lithuanian-ALKSNIS, UD_Lithuanian-HSE, UD_Marathi-UFAL, UD_Norwegian-Bokmaal, UD_Norwegian-Nynorsk, UD_Norwegian-NynorskLIA, UD_Persian-Seraji, UD_Portuguese-Bosque, UD_Portuguese-GSD, UD_Romanian-Nonstandard, UD_Romanian-RRT, UD_Russian-GSD, UD_Russian-Taiga, UD_Serbian-SET, UD_Slovak-SNK, UD_Spanish-GSD, UD_Swedish-Talbanken, UD_Telugu-MTG, UD_Vietnamese-VTB)](https://universaldependencies.org/) (Zeman, Daniel; Nivre, Joakim; Abrams, Mitchell; et al.) |
|
31 |
| **License** | `CC BY-SA 3.0` |
|
@@ -43,6 +43,6 @@ Multi-language pipeline optimized for CPU. Components: senter.
|
|
43 |
| `TOKEN_P` | 95.31 |
|
44 |
| `TOKEN_R` | 95.72 |
|
45 |
| `TOKEN_F` | 95.52 |
|
46 |
-
| `SENTS_P` | 90.
|
47 |
-
| `SENTS_R` | 81.
|
48 |
-
| `SENTS_F` | 85.
|
|
|
13 |
metrics:
|
14 |
- name: Sentences F-Score
|
15 |
type: f_score
|
16 |
+
value: 0.8580767932
|
17 |
---
|
18 |
### Details: https://spacy.io/models/xx#xx_sent_ud_sm
|
19 |
|
|
|
22 |
| Feature | Description |
|
23 |
| --- | --- |
|
24 |
| **Name** | `xx_sent_ud_sm` |
|
25 |
+
| **Version** | `3.4.0` |
|
26 |
+
| **spaCy** | `>=3.4.0,<3.5.0` |
|
27 |
+
| **Default Pipeline** | `senter` |
|
28 |
+
| **Components** | `senter` |
|
29 |
| **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
|
30 |
| **Sources** | [Universal Dependencies v2.8 (UD_Afrikaans-AfriBooms, UD_Croatian-SET, UD_Czech-CAC, UD_Czech-CLTT, UD_Danish-DDT, UD_Dutch-Alpino, UD_Dutch-LassySmall, UD_English-EWT, UD_Finnish-FTB, UD_Finnish-TDT, UD_French-GSD, UD_French-Spoken, UD_German-GSD, UD_Indonesian-GSD, UD_Irish-IDT, UD_Italian-TWITTIRO, UD_Korean-GSD, UD_Korean-Kaist, UD_Latvian-LVTB, UD_Lithuanian-ALKSNIS, UD_Lithuanian-HSE, UD_Marathi-UFAL, UD_Norwegian-Bokmaal, UD_Norwegian-Nynorsk, UD_Norwegian-NynorskLIA, UD_Persian-Seraji, UD_Portuguese-Bosque, UD_Portuguese-GSD, UD_Romanian-Nonstandard, UD_Romanian-RRT, UD_Russian-GSD, UD_Russian-Taiga, UD_Serbian-SET, UD_Slovak-SNK, UD_Spanish-GSD, UD_Swedish-Talbanken, UD_Telugu-MTG, UD_Vietnamese-VTB)](https://universaldependencies.org/) (Zeman, Daniel; Nivre, Joakim; Abrams, Mitchell; et al.) |
|
31 |
| **License** | `CC BY-SA 3.0` |
|
|
|
43 |
| `TOKEN_P` | 95.31 |
|
44 |
| `TOKEN_R` | 95.72 |
|
45 |
| `TOKEN_F` | 95.52 |
|
46 |
+
| `SENTS_P` | 90.67 |
|
47 |
+
| `SENTS_R` | 81.44 |
|
48 |
+
| `SENTS_F` | 85.81 |
|
accuracy.json
CHANGED
@@ -3,8 +3,8 @@
|
|
3 |
"token_p": 0.9530830451,
|
4 |
"token_r": 0.9572374635,
|
5 |
"token_f": 0.955155737,
|
6 |
-
"sents_p": 0.
|
7 |
-
"sents_r": 0.
|
8 |
-
"sents_f": 0.
|
9 |
-
"speed":
|
10 |
}
|
|
|
3 |
"token_p": 0.9530830451,
|
4 |
"token_r": 0.9572374635,
|
5 |
"token_f": 0.955155737,
|
6 |
+
"sents_p": 0.9067233159,
|
7 |
+
"sents_r": 0.8143843398,
|
8 |
+
"sents_f": 0.8580767932,
|
9 |
+
"speed": 174049.2099894174
|
10 |
}
|
config.cfg
CHANGED
@@ -10,7 +10,7 @@ seed = 0
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
-
pipeline = ["senter","attribute_ruler"]
|
14 |
disabled = []
|
15 |
before_creation = null
|
16 |
after_creation = null
|
@@ -20,11 +20,6 @@ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
|
20 |
|
21 |
[components]
|
22 |
|
23 |
-
[components.attribute_ruler]
|
24 |
-
factory = "attribute_ruler"
|
25 |
-
scorer = {"@scorers":"spacy.attribute_ruler_scorer.v1"}
|
26 |
-
validate = false
|
27 |
-
|
28 |
[components.senter]
|
29 |
factory = "senter"
|
30 |
overwrite = false
|
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
+
pipeline = ["senter"]
|
14 |
disabled = []
|
15 |
before_creation = null
|
16 |
after_creation = null
|
|
|
20 |
|
21 |
[components]
|
22 |
|
|
|
|
|
|
|
|
|
|
|
23 |
[components.senter]
|
24 |
factory = "senter"
|
25 |
overwrite = false
|
meta.json
CHANGED
@@ -1,14 +1,14 @@
|
|
1 |
{
|
2 |
"lang":"xx",
|
3 |
"name":"sent_ud_sm",
|
4 |
-
"version":"3.
|
5 |
"description":"Multi-language pipeline optimized for CPU. Components: senter.",
|
6 |
"author":"Explosion",
|
7 |
"email":"contact@explosion.ai",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 3.0",
|
10 |
-
"spacy_version":">=3.
|
11 |
-
"spacy_git_version":"
|
12 |
"vectors":{
|
13 |
"width":0,
|
14 |
"vectors":0,
|
@@ -16,17 +16,13 @@
|
|
16 |
"name":null
|
17 |
},
|
18 |
"labels":{
|
19 |
-
"attribute_ruler":[
|
20 |
|
21 |
-
]
|
22 |
},
|
23 |
"pipeline":[
|
24 |
-
"senter",
|
25 |
-
"attribute_ruler"
|
26 |
],
|
27 |
"components":[
|
28 |
-
"senter",
|
29 |
-
"attribute_ruler"
|
30 |
],
|
31 |
"disabled":[
|
32 |
|
@@ -36,10 +32,10 @@
|
|
36 |
"token_p":0.9530830451,
|
37 |
"token_r":0.9572374635,
|
38 |
"token_f":0.955155737,
|
39 |
-
"sents_p":0.
|
40 |
-
"sents_r":0.
|
41 |
-
"sents_f":0.
|
42 |
-
"speed":
|
43 |
},
|
44 |
"sources":[
|
45 |
{
|
|
|
1 |
{
|
2 |
"lang":"xx",
|
3 |
"name":"sent_ud_sm",
|
4 |
+
"version":"3.4.0",
|
5 |
"description":"Multi-language pipeline optimized for CPU. Components: senter.",
|
6 |
"author":"Explosion",
|
7 |
"email":"contact@explosion.ai",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 3.0",
|
10 |
+
"spacy_version":">=3.4.0,<3.5.0",
|
11 |
+
"spacy_git_version":"dd038b536",
|
12 |
"vectors":{
|
13 |
"width":0,
|
14 |
"vectors":0,
|
|
|
16 |
"name":null
|
17 |
},
|
18 |
"labels":{
|
|
|
19 |
|
|
|
20 |
},
|
21 |
"pipeline":[
|
22 |
+
"senter"
|
|
|
23 |
],
|
24 |
"components":[
|
25 |
+
"senter"
|
|
|
26 |
],
|
27 |
"disabled":[
|
28 |
|
|
|
32 |
"token_p":0.9530830451,
|
33 |
"token_r":0.9572374635,
|
34 |
"token_f":0.955155737,
|
35 |
+
"sents_p":0.9067233159,
|
36 |
+
"sents_r":0.8143843398,
|
37 |
+
"sents_f":0.8580767932,
|
38 |
+
"speed":174049.2099894174
|
39 |
},
|
40 |
"sources":[
|
41 |
{
|
senter/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 197089
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246adc5eaf65c874096bcbc872fe05e102f19e7f1f9fd1e3adce173f1b9a32be
|
3 |
size 197089
|
vocab/strings.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc7b2014c27f229fc1a30b1785a675047e7af79e4adf1c84e07521c7bf8b8ee9
|
3 |
+
size 22450815
|
xx_sent_ud_sm-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e43437e2847e57d913e86f978e3c86d2cc74d1b8caf6091757cd856a6d9c771
|
3 |
+
size 4324474
|