philipp-zettl
committed on
Update spaCy pipeline
Browse files- README.md +2 -2
- config.cfg +7 -4
- en_degree_ner-any-py3-none-any.whl +2 -2
- meta.json +5 -5
- ner/model +0 -0
- ner/moves +1 -1
- tok2vec/model +1 -1
- vocab/lookups.bin +2 -2
- vocab/strings.json +11 -0
README.md
CHANGED
@@ -24,8 +24,8 @@ model-index:
|
|
24 |
| Feature | Description |
|
25 |
| --- | --- |
|
26 |
| **Name** | `en_degree_ner` |
|
27 |
-
| **Version** | `0.
|
28 |
-
| **spaCy** | `>=3.
|
29 |
| **Default Pipeline** | `tok2vec`, `ner` |
|
30 |
| **Components** | `tok2vec`, `ner` |
|
31 |
| **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
|
|
|
24 |
| Feature | Description |
|
25 |
| --- | --- |
|
26 |
| **Name** | `en_degree_ner` |
|
27 |
+
| **Version** | `0.2.0` |
|
28 |
+
| **spaCy** | `>=3.6.1,<3.7.0` |
|
29 |
| **Default Pipeline** | `tok2vec`, `ner` |
|
30 |
| **Components** | `tok2vec`, `ner` |
|
31 |
| **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
|
config.cfg
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
[paths]
|
2 |
-
train = "degree_ner_train.spacy"
|
3 |
-
dev = "degree_ner_valid.spacy"
|
4 |
vectors = "en_core_web_sm"
|
5 |
init_tok2vec = null
|
6 |
|
@@ -17,7 +17,6 @@ before_creation = null
|
|
17 |
after_creation = null
|
18 |
after_pipeline_creation = null
|
19 |
tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
20 |
-
vectors = {"@vectors":"spacy.Vectors.v1"}
|
21 |
|
22 |
[components]
|
23 |
|
@@ -136,10 +135,14 @@ ents_per_type = null
|
|
136 |
vectors = ${paths.vectors}
|
137 |
init_tok2vec = ${paths.init_tok2vec}
|
138 |
vocab_data = null
|
139 |
-
lookups = null
|
140 |
before_init = null
|
141 |
after_init = null
|
142 |
|
143 |
[initialize.components]
|
144 |
|
|
|
|
|
|
|
|
|
|
|
145 |
[initialize.tokenizer]
|
|
|
1 |
[paths]
|
2 |
+
train = "training_data/degree_ner_train.spacy"
|
3 |
+
dev = "training_data/degree_ner_valid.spacy"
|
4 |
vectors = "en_core_web_sm"
|
5 |
init_tok2vec = null
|
6 |
|
|
|
17 |
after_creation = null
|
18 |
after_pipeline_creation = null
|
19 |
tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
|
|
20 |
|
21 |
[components]
|
22 |
|
|
|
135 |
vectors = ${paths.vectors}
|
136 |
init_tok2vec = ${paths.init_tok2vec}
|
137 |
vocab_data = null
|
|
|
138 |
before_init = null
|
139 |
after_init = null
|
140 |
|
141 |
[initialize.components]
|
142 |
|
143 |
+
[initialize.lookups]
|
144 |
+
@misc = "spacy.LookupsDataLoader.v1"
|
145 |
+
lang = ${nlp.lang}
|
146 |
+
tables = ["lexeme_norm"]
|
147 |
+
|
148 |
[initialize.tokenizer]
|
en_degree_ner-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef8317dc8d7607ed3afa375f804c9ee93d74961af4d73308fb76977b8205d044
|
3 |
+
size 31996372
|
meta.json
CHANGED
@@ -1,14 +1,14 @@
|
|
1 |
{
|
2 |
"lang":"en",
|
3 |
"name":"degree_ner",
|
4 |
-
"version":"0.
|
5 |
"description":"",
|
6 |
"author":"",
|
7 |
"email":"",
|
8 |
"url":"",
|
9 |
"license":"",
|
10 |
-
"spacy_version":">=3.
|
11 |
-
"spacy_git_version":"
|
12 |
"vectors":{
|
13 |
"width":0,
|
14 |
"vectors":0,
|
@@ -45,8 +45,8 @@
|
|
45 |
"f":1.0
|
46 |
}
|
47 |
},
|
48 |
-
"tok2vec_loss":0.
|
49 |
-
"ner_loss":0.
|
50 |
},
|
51 |
"requirements":[
|
52 |
|
|
|
1 |
{
|
2 |
"lang":"en",
|
3 |
"name":"degree_ner",
|
4 |
+
"version":"0.2.0",
|
5 |
"description":"",
|
6 |
"author":"",
|
7 |
"email":"",
|
8 |
"url":"",
|
9 |
"license":"",
|
10 |
+
"spacy_version":">=3.6.1,<3.7.0",
|
11 |
+
"spacy_git_version":"458bc5f45",
|
12 |
"vectors":{
|
13 |
"width":0,
|
14 |
"vectors":0,
|
|
|
45 |
"f":1.0
|
46 |
}
|
47 |
},
|
48 |
+
"tok2vec_loss":0.0,
|
49 |
+
"ner_loss":0.0
|
50 |
},
|
51 |
"requirements":[
|
52 |
|
ner/model
CHANGED
Binary files a/ner/model and b/ner/model differ
|
|
ner/moves
CHANGED
@@ -1 +1 @@
|
|
1 |
-
��moves�p{"0":{},"1":{"DEGREE":
|
|
|
1 |
+
��moves�p{"0":{},"1":{"DEGREE":484792},"2":{"DEGREE":484792},"3":{"DEGREE":484792},"4":{"DEGREE":484792,"":1},"5":{"":1}}�cfg��neg_key�
|
tok2vec/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 34126801
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a07b207de049fd5a5a2c38017156daa5b2c6110ca56870557b88ab26352aa973
|
3 |
size 34126801
|
vocab/lookups.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fce9c883c56165f29573cc938c2a1c9d417ac61bd8f56b671dd5f7996de70682
|
3 |
+
size 70040
|
vocab/strings.json
CHANGED
@@ -12194,6 +12194,7 @@
|
|
12194 |
"Dionysius",
|
12195 |
"Diotrephes",
|
12196 |
"Dip",
|
|
|
12197 |
"Diploma",
|
12198 |
"Diplomacy",
|
12199 |
"Diplomatic",
|
@@ -16111,6 +16112,7 @@
|
|
16111 |
"Higgenbotham",
|
16112 |
"Higgins",
|
16113 |
"High",
|
|
|
16114 |
"Higher",
|
16115 |
"Highest",
|
16116 |
"Highland",
|
@@ -16237,6 +16239,7 @@
|
|
16237 |
"Holcomb",
|
16238 |
"Hold",
|
16239 |
"Holden",
|
|
|
16240 |
"Holders",
|
16241 |
"Holding",
|
16242 |
"Holdings",
|
@@ -16322,6 +16325,7 @@
|
|
16322 |
"Honorable",
|
16323 |
"Honorary",
|
16324 |
"Honors",
|
|
|
16325 |
"Hood",
|
16326 |
"Hooker",
|
16327 |
"Hooks",
|
@@ -17939,6 +17943,7 @@
|
|
17939 |
"K",
|
17940 |
"K's",
|
17941 |
"K.",
|
|
|
17942 |
"KAISER",
|
17943 |
"KB",
|
17944 |
"KC",
|
@@ -23387,6 +23392,7 @@
|
|
23387 |
"Pharpar",
|
23388 |
"Phase",
|
23389 |
"Phasing",
|
|
|
23390 |
"Phelan",
|
23391 |
"Phelps",
|
23392 |
"Phenix",
|
@@ -24066,6 +24072,7 @@
|
|
24066 |
"Prussia",
|
24067 |
"Pryce",
|
24068 |
"Pryor",
|
|
|
24069 |
"Psa",
|
24070 |
"Psalm",
|
24071 |
"Psalms",
|
@@ -44267,6 +44274,7 @@
|
|
44267 |
"dioxins",
|
44268 |
"dip",
|
44269 |
"diphtheria",
|
|
|
44270 |
"diploma",
|
44271 |
"diplomacy",
|
44272 |
"diplomas",
|
@@ -53000,6 +53008,7 @@
|
|
53000 |
"honour",
|
53001 |
"honourable",
|
53002 |
"honoured",
|
|
|
53003 |
"hoo",
|
53004 |
"hood",
|
53005 |
"hooded",
|
@@ -55328,6 +55337,7 @@
|
|
55328 |
"ipe",
|
55329 |
"iph",
|
55330 |
"iphone",
|
|
|
55331 |
"ipo",
|
55332 |
"ipod",
|
55333 |
"ipods",
|
@@ -56401,6 +56411,7 @@
|
|
56401 |
"k.",
|
56402 |
"k.a",
|
56403 | |
|
|
56404 |
"kV",
|
56405 |
"kWh",
|
56406 |
"ka",
|
|
|
12194 |
"Dionysius",
|
12195 |
"Diotrephes",
|
12196 |
"Dip",
|
12197 |
+
"Dipl",
|
12198 |
"Diploma",
|
12199 |
"Diplomacy",
|
12200 |
"Diplomatic",
|
|
|
16112 |
"Higgenbotham",
|
16113 |
"Higgins",
|
16114 |
"High",
|
16115 |
+
"HighSchool",
|
16116 |
"Higher",
|
16117 |
"Highest",
|
16118 |
"Highland",
|
|
|
16239 |
"Holcomb",
|
16240 |
"Hold",
|
16241 |
"Holden",
|
16242 |
+
"Holder",
|
16243 |
"Holders",
|
16244 |
"Holding",
|
16245 |
"Holdings",
|
|
|
16325 |
"Honorable",
|
16326 |
"Honorary",
|
16327 |
"Honors",
|
16328 |
+
"Honours",
|
16329 |
"Hood",
|
16330 |
"Hooker",
|
16331 |
"Hooks",
|
|
|
17943 |
"K",
|
17944 |
"K's",
|
17945 |
"K.",
|
17946 |
+
"K12",
|
17947 |
"KAISER",
|
17948 |
"KB",
|
17949 |
"KC",
|
|
|
23392 |
"Pharpar",
|
23393 |
"Phase",
|
23394 |
"Phasing",
|
23395 |
+
"Phd",
|
23396 |
"Phelan",
|
23397 |
"Phelps",
|
23398 |
"Phenix",
|
|
|
24072 |
"Prussia",
|
24073 |
"Pryce",
|
24074 |
"Pryor",
|
24075 |
+
"Ps",
|
24076 |
"Psa",
|
24077 |
"Psalm",
|
24078 |
"Psalms",
|
|
|
44274 |
"dioxins",
|
44275 |
"dip",
|
44276 |
"diphtheria",
|
44277 |
+
"dipl",
|
44278 |
"diploma",
|
44279 |
"diplomacy",
|
44280 |
"diplomas",
|
|
|
53008 |
"honour",
|
53009 |
"honourable",
|
53010 |
"honoured",
|
53011 |
+
"honours",
|
53012 |
"hoo",
|
53013 |
"hood",
|
53014 |
"hooded",
|
|
|
55337 |
"ipe",
|
55338 |
"iph",
|
55339 |
"iphone",
|
55340 |
+
"ipl",
|
55341 |
"ipo",
|
55342 |
"ipod",
|
55343 |
"ipods",
|
|
|
56411 |
"k.",
|
56412 |
"k.a",
|
56413 | |
56414 |
+
"k12",
|
56415 |
"kV",
|
56416 |
"kWh",
|
56417 |
"ka",
|