philipp-zettl committed on
Commit
70996be
·
verified ·
1 Parent(s): 74d7384

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -24,8 +24,8 @@ model-index:
24
  | Feature | Description |
25
  | --- | --- |
26
  | **Name** | `en_degree_ner` |
27
- | **Version** | `0.1.0` |
28
- | **spaCy** | `>=3.7.4,<3.8.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
24
  | Feature | Description |
25
  | --- | --- |
26
  | **Name** | `en_degree_ner` |
27
+ | **Version** | `0.2.0` |
28
+ | **spaCy** | `>=3.6.1,<3.7.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
config.cfg CHANGED
@@ -1,6 +1,6 @@
1
  [paths]
2
- train = "degree_ner_train.spacy"
3
- dev = "degree_ner_valid.spacy"
4
  vectors = "en_core_web_sm"
5
  init_tok2vec = null
6
 
@@ -17,7 +17,6 @@ before_creation = null
17
  after_creation = null
18
  after_pipeline_creation = null
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
- vectors = {"@vectors":"spacy.Vectors.v1"}
21
 
22
  [components]
23
 
@@ -136,10 +135,14 @@ ents_per_type = null
136
  vectors = ${paths.vectors}
137
  init_tok2vec = ${paths.init_tok2vec}
138
  vocab_data = null
139
- lookups = null
140
  before_init = null
141
  after_init = null
142
 
143
  [initialize.components]
144
 
 
 
 
 
 
145
  [initialize.tokenizer]
 
1
  [paths]
2
+ train = "training_data/degree_ner_train.spacy"
3
+ dev = "training_data/degree_ner_valid.spacy"
4
  vectors = "en_core_web_sm"
5
  init_tok2vec = null
6
 
 
17
  after_creation = null
18
  after_pipeline_creation = null
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
 
20
 
21
  [components]
22
 
 
135
  vectors = ${paths.vectors}
136
  init_tok2vec = ${paths.init_tok2vec}
137
  vocab_data = null
 
138
  before_init = null
139
  after_init = null
140
 
141
  [initialize.components]
142
 
143
+ [initialize.lookups]
144
+ @misc = "spacy.LookupsDataLoader.v1"
145
+ lang = ${nlp.lang}
146
+ tables = ["lexeme_norm"]
147
+
148
  [initialize.tokenizer]
en_degree_ner-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae21d2e7ab6d2eecc862390da6e56ea659758825b15781aae89c40790489e47c
3
- size 31925456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef8317dc8d7607ed3afa375f804c9ee93d74961af4d73308fb76977b8205d044
3
+ size 31996372
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"en",
3
  "name":"degree_ner",
4
- "version":"0.1.0",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
- "spacy_version":">=3.7.4,<3.8.0",
11
- "spacy_git_version":"bff8725f4",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -45,8 +45,8 @@
45
  "f":1.0
46
  }
47
  },
48
- "tok2vec_loss":0.0000000273,
49
- "ner_loss":0.000000224
50
  },
51
  "requirements":[
52
 
 
1
  {
2
  "lang":"en",
3
  "name":"degree_ner",
4
+ "version":"0.2.0",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
+ "spacy_version":">=3.6.1,<3.7.0",
11
+ "spacy_git_version":"458bc5f45",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
45
  "f":1.0
46
  }
47
  },
48
+ "tok2vec_loss":0.0,
49
+ "ner_loss":0.0
50
  },
51
  "requirements":[
52
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves�p{"0":{},"1":{"DEGREE":280503},"2":{"DEGREE":280503},"3":{"DEGREE":280503},"4":{"DEGREE":280503,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves�p{"0":{},"1":{"DEGREE":484792},"2":{"DEGREE":484792},"3":{"DEGREE":484792},"4":{"DEGREE":484792,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c47bcf6c1c21504e5f6276f591159d92526567eab0a7141cb684edf864f86f11
3
  size 34126801
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a07b207de049fd5a5a2c38017156daa5b2c6110ca56870557b88ab26352aa973
3
  size 34126801
vocab/lookups.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
- size 1
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce9c883c56165f29573cc938c2a1c9d417ac61bd8f56b671dd5f7996de70682
3
+ size 70040
vocab/strings.json CHANGED
@@ -12194,6 +12194,7 @@
12194
  "Dionysius",
12195
  "Diotrephes",
12196
  "Dip",
 
12197
  "Diploma",
12198
  "Diplomacy",
12199
  "Diplomatic",
@@ -16111,6 +16112,7 @@
16111
  "Higgenbotham",
16112
  "Higgins",
16113
  "High",
 
16114
  "Higher",
16115
  "Highest",
16116
  "Highland",
@@ -16237,6 +16239,7 @@
16237
  "Holcomb",
16238
  "Hold",
16239
  "Holden",
 
16240
  "Holders",
16241
  "Holding",
16242
  "Holdings",
@@ -16322,6 +16325,7 @@
16322
  "Honorable",
16323
  "Honorary",
16324
  "Honors",
 
16325
  "Hood",
16326
  "Hooker",
16327
  "Hooks",
@@ -17939,6 +17943,7 @@
17939
  "K",
17940
  "K's",
17941
  "K.",
 
17942
  "KAISER",
17943
  "KB",
17944
  "KC",
@@ -23387,6 +23392,7 @@
23387
  "Pharpar",
23388
  "Phase",
23389
  "Phasing",
 
23390
  "Phelan",
23391
  "Phelps",
23392
  "Phenix",
@@ -24066,6 +24072,7 @@
24066
  "Prussia",
24067
  "Pryce",
24068
  "Pryor",
 
24069
  "Psa",
24070
  "Psalm",
24071
  "Psalms",
@@ -44267,6 +44274,7 @@
44267
  "dioxins",
44268
  "dip",
44269
  "diphtheria",
 
44270
  "diploma",
44271
  "diplomacy",
44272
  "diplomas",
@@ -53000,6 +53008,7 @@
53000
  "honour",
53001
  "honourable",
53002
  "honoured",
 
53003
  "hoo",
53004
  "hood",
53005
  "hooded",
@@ -55328,6 +55337,7 @@
55328
  "ipe",
55329
  "iph",
55330
  "iphone",
 
55331
  "ipo",
55332
  "ipod",
55333
  "ipods",
@@ -56401,6 +56411,7 @@
56401
  "k.",
56402
  "k.a",
56403
 
56404
  "kV",
56405
  "kWh",
56406
  "ka",
 
12194
  "Dionysius",
12195
  "Diotrephes",
12196
  "Dip",
12197
+ "Dipl",
12198
  "Diploma",
12199
  "Diplomacy",
12200
  "Diplomatic",
 
16112
  "Higgenbotham",
16113
  "Higgins",
16114
  "High",
16115
+ "HighSchool",
16116
  "Higher",
16117
  "Highest",
16118
  "Highland",
 
16239
  "Holcomb",
16240
  "Hold",
16241
  "Holden",
16242
+ "Holder",
16243
  "Holders",
16244
  "Holding",
16245
  "Holdings",
 
16325
  "Honorable",
16326
  "Honorary",
16327
  "Honors",
16328
+ "Honours",
16329
  "Hood",
16330
  "Hooker",
16331
  "Hooks",
 
17943
  "K",
17944
  "K's",
17945
  "K.",
17946
+ "K12",
17947
  "KAISER",
17948
  "KB",
17949
  "KC",
 
23392
  "Pharpar",
23393
  "Phase",
23394
  "Phasing",
23395
+ "Phd",
23396
  "Phelan",
23397
  "Phelps",
23398
  "Phenix",
 
24072
  "Prussia",
24073
  "Pryce",
24074
  "Pryor",
24075
+ "Ps",
24076
  "Psa",
24077
  "Psalm",
24078
  "Psalms",
 
44274
  "dioxins",
44275
  "dip",
44276
  "diphtheria",
44277
+ "dipl",
44278
  "diploma",
44279
  "diplomacy",
44280
  "diplomas",
 
53008
  "honour",
53009
  "honourable",
53010
  "honoured",
53011
+ "honours",
53012
  "hoo",
53013
  "hood",
53014
  "hooded",
 
55337
  "ipe",
55338
  "iph",
55339
  "iphone",
55340
+ "ipl",
55341
  "ipo",
55342
  "ipod",
55343
  "ipods",
 
56411
  "k.",
56412
  "k.a",
56413
56414
+ "k12",
56415
  "kV",
56416
  "kWh",
56417
  "ka",