adrianeboyd committed on
Commit
cbd9cb3
1 Parent(s): 49f366e

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,27 +14,27 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.8298969072
18
  - name: NER Recall
19
  type: recall
20
- value: 0.8100628931
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8198599618
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9712488769
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9798207196
38
  - task:
39
  name: MORPH
40
  type: token-classification
@@ -55,21 +55,21 @@ model-index:
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.9355666622
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.9241776538
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9755142018
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_trf
75
 
@@ -78,8 +78,8 @@ Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_trf` |
81
- | **Version** | `3.5.0` |
82
- | **spaCy** | `>=3.5.0,<3.6.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -111,16 +111,16 @@ Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components
111
  | `TOKEN_F` | 97.77 |
112
  | `POS_ACC` | 97.98 |
113
  | `MORPH_ACC` | 0.00 |
114
- | `MORPH_MICRO_P` | 33.56 |
115
- | `MORPH_MICRO_R` | 96.08 |
116
- | `MORPH_MICRO_F` | 49.75 |
117
- | `SENTS_P` | 96.89 |
118
- | `SENTS_R` | 98.22 |
119
- | `SENTS_F` | 97.55 |
120
- | `DEP_UAS` | 93.56 |
121
- | `DEP_LAS` | 92.42 |
122
- | `TAG_ACC` | 97.12 |
123
  | `LEMMA_ACC` | 96.71 |
124
- | `ENTS_P` | 82.99 |
125
- | `ENTS_R` | 81.01 |
126
- | `ENTS_F` | 81.99 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.8356510746
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.8314465409
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.8335435057
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9713305562
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9798190675
38
  - task:
39
  name: MORPH
40
  type: token-classification
 
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.9311959654
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.9202934425
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9639727361
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_trf
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_trf` |
81
+ | **Version** | `3.6.1` |
82
+ | **spaCy** | `>=3.6.0,<3.7.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
111
  | `TOKEN_F` | 97.77 |
112
  | `POS_ACC` | 97.98 |
113
  | `MORPH_ACC` | 0.00 |
114
+ | `MORPH_MICRO_P` | 34.01 |
115
+ | `MORPH_MICRO_R` | 98.04 |
116
+ | `MORPH_MICRO_F` | 50.51 |
117
+ | `SENTS_P` | 95.19 |
118
+ | `SENTS_R` | 97.63 |
119
+ | `SENTS_F` | 96.40 |
120
+ | `DEP_UAS` | 93.12 |
121
+ | `DEP_LAS` | 92.03 |
122
+ | `TAG_ACC` | 97.13 |
123
  | `LEMMA_ACC` | 96.71 |
124
+ | `ENTS_P` | 83.57 |
125
+ | `ENTS_R` | 83.14 |
126
+ | `ENTS_F` | 83.35 |
accuracy.json CHANGED
@@ -3,16 +3,16 @@
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
- "pos_acc": 0.9798207196,
7
  "morph_acc": 0.0,
8
- "morph_micro_p": 0.3356164384,
9
- "morph_micro_r": 0.9607843137,
10
- "morph_micro_f": 0.4974619289,
11
  "morph_per_feat": {
12
  "Polarity": {
13
  "p": 1.0,
14
- "r": 0.9607843137,
15
- "f": 0.98
16
  },
17
  "Inflection": {
18
  "p": 0.0,
@@ -25,106 +25,106 @@
25
  "f": 0.0
26
  }
27
  },
28
- "sents_p": 0.9688715953,
29
- "sents_r": 0.9822485207,
30
- "sents_f": 0.9755142018,
31
- "dep_uas": 0.9355666622,
32
- "dep_las": 0.9241776538,
33
  "dep_las_per_type": {
34
  "cc": {
35
- "p": 0.875,
36
  "r": 0.875,
37
- "f": 0.875
38
  },
39
  "compound": {
40
- "p": 0.9552414605,
41
- "r": 0.9143179256,
42
- "f": 0.9343317972
43
  },
44
  "obl": {
45
- "p": 0.8567901235,
46
- "r": 0.8664169788,
47
- "f": 0.8615766605
48
  },
49
  "case": {
50
- "p": 0.990015361,
51
- "r": 0.9794832827,
52
- "f": 0.9847211612
53
  },
54
  "dislocated": {
55
- "p": 0.8181818182,
56
- "r": 0.6923076923,
57
- "f": 0.75
58
  },
59
  "nsubj": {
60
- "p": 0.875,
61
- "r": 0.8598848369,
62
- "f": 0.8673765731
63
  },
64
  "nmod": {
65
- "p": 0.921641791,
66
- "r": 0.8666666667,
67
- "f": 0.8933092224
68
  },
69
  "root": {
70
- "p": 0.9645669291,
71
- "r": 0.966469428,
72
- "f": 0.9655172414
73
  },
74
  "aux": {
75
- "p": 0.9757462687,
76
- "r": 0.9712163417,
77
- "f": 0.9734760354
78
  },
79
  "advcl": {
80
- "p": 0.7333333333,
81
- "r": 0.7415730337,
82
- "f": 0.7374301676
83
  },
84
  "mark": {
85
- "p": 0.964,
86
- "r": 0.964,
87
- "f": 0.964
88
  },
89
  "fixed": {
90
- "p": 0.9663716814,
91
- "r": 0.9927272727,
92
- "f": 0.9793721973
93
  },
94
  "acl": {
95
- "p": 0.8780487805,
96
- "r": 0.8703296703,
97
- "f": 0.8741721854
98
  },
99
  "obj": {
100
- "p": 0.9726443769,
101
- "r": 0.9667673716,
102
- "f": 0.9696969697
103
  },
104
  "nummod": {
105
- "p": 0.9806451613,
106
  "r": 0.899408284,
107
- "f": 0.9382716049
108
  },
109
  "advmod": {
110
- "p": 0.7388059701,
111
- "r": 0.7071428571,
112
- "f": 0.7226277372
113
  },
114
  "amod": {
115
- "p": 0.9333333333,
116
- "r": 0.7567567568,
117
- "f": 0.8358208955
118
  },
119
  "cop": {
120
- "p": 0.9821428571,
121
- "r": 0.9593023256,
122
- "f": 0.9705882353
123
  },
124
  "ccomp": {
125
- "p": 0.9444444444,
126
- "r": 0.7727272727,
127
- "f": 0.85
128
  },
129
  "det": {
130
  "p": 1.0,
@@ -132,76 +132,76 @@
132
  "f": 0.9904761905
133
  },
134
  "csubj": {
135
- "p": 0.7692307692,
136
- "r": 0.8333333333,
137
- "f": 0.8
138
  },
139
  "dep": {
140
- "p": 0.2857142857,
141
  "r": 0.2857142857,
142
- "f": 0.2857142857
143
  }
144
  },
145
- "tag_acc": 0.9712488769,
146
  "lemma_acc": 0.9670526831,
147
- "ents_p": 0.8298969072,
148
- "ents_r": 0.8100628931,
149
- "ents_f": 0.8198599618,
150
  "ents_per_type": {
151
  "DATE": {
152
- "p": 0.9906542056,
153
- "r": 0.9724770642,
154
- "f": 0.9814814815
155
  },
156
  "ORG": {
157
- "p": 0.7445255474,
158
  "r": 0.7445255474,
159
- "f": 0.7445255474
 
 
 
 
 
160
  },
161
  "PERSON": {
162
- "p": 0.9516129032,
163
- "r": 0.8489208633,
164
- "f": 0.897338403
165
  },
166
  "GPE": {
167
- "p": 0.79,
168
  "r": 0.8404255319,
169
- "f": 0.8144329897
170
  },
171
  "PRODUCT": {
172
- "p": 0.5945945946,
173
- "r": 0.5238095238,
174
- "f": 0.5569620253
175
  },
176
  "TIME": {
177
- "p": 0.8,
178
  "r": 1.0,
179
- "f": 0.8888888889
180
  },
181
  "QUANTITY": {
182
- "p": 0.8904109589,
183
- "r": 0.9848484848,
184
- "f": 0.9352517986
185
  },
186
  "NORP": {
187
- "p": 0.6785714286,
188
- "r": 0.59375,
189
- "f": 0.6333333333
190
- },
191
- "TITLE_AFFIX": {
192
- "p": 0.7857142857,
193
- "r": 0.7333333333,
194
- "f": 0.7586206897
195
  },
196
  "ORDINAL": {
197
- "p": 0.652173913,
198
- "r": 0.6818181818,
199
- "f": 0.6666666667
200
  },
201
  "WORK_OF_ART": {
202
- "p": 0.8461538462,
203
- "r": 0.6470588235,
204
- "f": 0.7333333333
205
  },
206
  "CARDINAL": {
207
  "p": 1.0,
@@ -209,29 +209,29 @@
209
  "f": 0.6666666667
210
  },
211
  "LOC": {
212
- "p": 0.6,
213
- "r": 0.9,
214
- "f": 0.72
215
  },
216
  "PERCENT": {
217
  "p": 1.0,
218
- "r": 0.7142857143,
219
- "f": 0.8333333333
220
  },
221
  "EVENT": {
222
- "p": 0.9090909091,
223
- "r": 0.7692307692,
224
- "f": 0.8333333333
225
  },
226
  "FAC": {
227
- "p": 0.7692307692,
228
- "r": 0.8108108108,
229
- "f": 0.7894736842
230
  },
231
  "MOVEMENT": {
232
- "p": 0.3333333333,
233
- "r": 0.2,
234
- "f": 0.25
235
  },
236
  "LAW": {
237
  "p": 0.6666666667,
@@ -249,5 +249,5 @@
249
  "f": 1.0
250
  }
251
  },
252
- "speed": 3501.8234367587
253
  }
 
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
+ "pos_acc": 0.9798190675,
7
  "morph_acc": 0.0,
8
+ "morph_micro_p": 0.3401360544,
9
+ "morph_micro_r": 0.9803921569,
10
+ "morph_micro_f": 0.5050505051,
11
  "morph_per_feat": {
12
  "Polarity": {
13
  "p": 1.0,
14
+ "r": 0.9803921569,
15
+ "f": 0.9900990099
16
  },
17
  "Inflection": {
18
  "p": 0.0,
 
25
  "f": 0.0
26
  }
27
  },
28
+ "sents_p": 0.9519230769,
29
+ "sents_r": 0.9763313609,
30
+ "sents_f": 0.9639727361,
31
+ "dep_uas": 0.9311959654,
32
+ "dep_las": 0.9202934425,
33
  "dep_las_per_type": {
34
  "cc": {
35
+ "p": 0.8936170213,
36
  "r": 0.875,
37
+ "f": 0.8842105263
38
  },
39
  "compound": {
40
+ "p": 0.9544917258,
41
+ "r": 0.9103720406,
42
+ "f": 0.9319099827
43
  },
44
  "obl": {
45
+ "p": 0.8436724566,
46
+ "r": 0.8489388265,
47
+ "f": 0.8462974487
48
  },
49
  "case": {
50
+ "p": 0.9832317073,
51
+ "r": 0.9802431611,
52
+ "f": 0.9817351598
53
  },
54
  "dislocated": {
55
+ "p": 0.6666666667,
56
+ "r": 0.6153846154,
57
+ "f": 0.64
58
  },
59
  "nsubj": {
60
+ "p": 0.8618677043,
61
+ "r": 0.8502879079,
62
+ "f": 0.8560386473
63
  },
64
  "nmod": {
65
+ "p": 0.9235588972,
66
+ "r": 0.8619883041,
67
+ "f": 0.8917120387
68
  },
69
  "root": {
70
+ "p": 0.9359223301,
71
+ "r": 0.9506903353,
72
+ "f": 0.9432485323
73
  },
74
  "aux": {
75
+ "p": 0.9765698219,
76
+ "r": 0.9675023213,
77
+ "f": 0.9720149254
78
  },
79
  "advcl": {
80
+ "p": 0.7379310345,
81
+ "r": 0.7213483146,
82
+ "f": 0.7295454545
83
  },
84
  "mark": {
85
+ "p": 0.9756592292,
86
+ "r": 0.962,
87
+ "f": 0.9687814703
88
  },
89
  "fixed": {
90
+ "p": 0.9661921708,
91
+ "r": 0.9872727273,
92
+ "f": 0.976618705
93
  },
94
  "acl": {
95
+ "p": 0.8942731278,
96
+ "r": 0.8923076923,
97
+ "f": 0.8932893289
98
  },
99
  "obj": {
100
+ "p": 0.9539877301,
101
+ "r": 0.9395770393,
102
+ "f": 0.9467275495
103
  },
104
  "nummod": {
105
+ "p": 0.987012987,
106
  "r": 0.899408284,
107
+ "f": 0.9411764706
108
  },
109
  "advmod": {
110
+ "p": 0.7537313433,
111
+ "r": 0.7214285714,
112
+ "f": 0.7372262774
113
  },
114
  "amod": {
115
+ "p": 0.9375,
116
+ "r": 0.8108108108,
117
+ "f": 0.8695652174
118
  },
119
  "cop": {
120
+ "p": 0.9764705882,
121
+ "r": 0.9651162791,
122
+ "f": 0.9707602339
123
  },
124
  "ccomp": {
125
+ "p": 0.9047619048,
126
+ "r": 0.8636363636,
127
+ "f": 0.8837209302
128
  },
129
  "det": {
130
  "p": 1.0,
 
132
  "f": 0.9904761905
133
  },
134
  "csubj": {
135
+ "p": 0.7333333333,
136
+ "r": 0.9166666667,
137
+ "f": 0.8148148148
138
  },
139
  "dep": {
140
+ "p": 0.25,
141
  "r": 0.2857142857,
142
+ "f": 0.2666666667
143
  }
144
  },
145
+ "tag_acc": 0.9713305562,
146
  "lemma_acc": 0.9670526831,
147
+ "ents_p": 0.8356510746,
148
+ "ents_r": 0.8314465409,
149
+ "ents_f": 0.8335435057,
150
  "ents_per_type": {
151
  "DATE": {
152
+ "p": 0.9727272727,
153
+ "r": 0.9816513761,
154
+ "f": 0.9771689498
155
  },
156
  "ORG": {
157
+ "p": 0.7906976744,
158
  "r": 0.7445255474,
159
+ "f": 0.7669172932
160
+ },
161
+ "TITLE_AFFIX": {
162
+ "p": 0.9230769231,
163
+ "r": 0.8,
164
+ "f": 0.8571428571
165
  },
166
  "PERSON": {
167
+ "p": 0.8865248227,
168
+ "r": 0.8992805755,
169
+ "f": 0.8928571429
170
  },
171
  "GPE": {
172
+ "p": 0.8404255319,
173
  "r": 0.8404255319,
174
+ "f": 0.8404255319
175
  },
176
  "PRODUCT": {
177
+ "p": 0.625,
178
+ "r": 0.5952380952,
179
+ "f": 0.6097560976
180
  },
181
  "TIME": {
182
+ "p": 1.0,
183
  "r": 1.0,
184
+ "f": 1.0
185
  },
186
  "QUANTITY": {
187
+ "p": 0.875,
188
+ "r": 0.9545454545,
189
+ "f": 0.9130434783
190
  },
191
  "NORP": {
192
+ "p": 0.6875,
193
+ "r": 0.6875,
194
+ "f": 0.6875
 
 
 
 
 
195
  },
196
  "ORDINAL": {
197
+ "p": 0.64,
198
+ "r": 0.7272727273,
199
+ "f": 0.6808510638
200
  },
201
  "WORK_OF_ART": {
202
+ "p": 0.8,
203
+ "r": 0.7058823529,
204
+ "f": 0.75
205
  },
206
  "CARDINAL": {
207
  "p": 1.0,
 
209
  "f": 0.6666666667
210
  },
211
  "LOC": {
212
+ "p": 0.5714285714,
213
+ "r": 0.8,
214
+ "f": 0.6666666667
215
  },
216
  "PERCENT": {
217
  "p": 1.0,
218
+ "r": 1.0,
219
+ "f": 1.0
220
  },
221
  "EVENT": {
222
+ "p": 0.9130434783,
223
+ "r": 0.8076923077,
224
+ "f": 0.8571428571
225
  },
226
  "FAC": {
227
+ "p": 0.7179487179,
228
+ "r": 0.7567567568,
229
+ "f": 0.7368421053
230
  },
231
  "MOVEMENT": {
232
+ "p": 0.6666666667,
233
+ "r": 0.4,
234
+ "f": 0.5
235
  },
236
  "LAW": {
237
  "p": 0.6666666667,
 
249
  "f": 1.0
250
  }
251
  },
252
+ "speed": 668.4231187225
253
  }
config.cfg CHANGED
@@ -96,8 +96,8 @@ max_batch_items = 4096
96
  set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
97
 
98
  [components.transformer.model]
99
- @architectures = "spacy-transformers.TransformerModel.v3"
100
  name = "cl-tohoku/bert-base-japanese-char-v2"
 
101
  mixed_precision = false
102
 
103
  [components.transformer.model.get_spans]
 
96
  set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
97
 
98
  [components.transformer.model]
 
99
  name = "cl-tohoku/bert-base-japanese-char-v2"
100
+ @architectures = "spacy-transformers.TransformerModel.v3"
101
  mixed_precision = false
102
 
103
  [components.transformer.model.get_spans]
ja_core_news_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af1c8bca8b1a4de8acff4e37981769d1234e36f3cfdfac49806c402a5b88dd2c
3
- size 337887987
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf7e1ee38ed3b7191498980ae170fc9b3dc3f6a979dc82e7e9efa8cc0b746ff4
3
+ size 337889759
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ja",
3
  "name":"core_news_trf",
4
- "version":"3.5.0",
5
  "description":"Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components: transformer, morphologizer, parser, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 3.0",
10
- "spacy_version":">=3.5.0,<3.6.0",
11
- "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -115,16 +115,16 @@
115
  "token_p":0.9764591282,
116
  "token_r":0.9790021974,
117
  "token_f":0.9777290092,
118
- "pos_acc":0.9798207196,
119
  "morph_acc":0.0,
120
- "morph_micro_p":0.3356164384,
121
- "morph_micro_r":0.9607843137,
122
- "morph_micro_f":0.4974619289,
123
  "morph_per_feat":{
124
  "Polarity":{
125
  "p":1.0,
126
- "r":0.9607843137,
127
- "f":0.98
128
  },
129
  "Inflection":{
130
  "p":0.0,
@@ -137,106 +137,106 @@
137
  "f":0.0
138
  }
139
  },
140
- "sents_p":0.9688715953,
141
- "sents_r":0.9822485207,
142
- "sents_f":0.9755142018,
143
- "dep_uas":0.9355666622,
144
- "dep_las":0.9241776538,
145
  "dep_las_per_type":{
146
  "cc":{
147
- "p":0.875,
148
  "r":0.875,
149
- "f":0.875
150
  },
151
  "compound":{
152
- "p":0.9552414605,
153
- "r":0.9143179256,
154
- "f":0.9343317972
155
  },
156
  "obl":{
157
- "p":0.8567901235,
158
- "r":0.8664169788,
159
- "f":0.8615766605
160
  },
161
  "case":{
162
- "p":0.990015361,
163
- "r":0.9794832827,
164
- "f":0.9847211612
165
  },
166
  "dislocated":{
167
- "p":0.8181818182,
168
- "r":0.6923076923,
169
- "f":0.75
170
  },
171
  "nsubj":{
172
- "p":0.875,
173
- "r":0.8598848369,
174
- "f":0.8673765731
175
  },
176
  "nmod":{
177
- "p":0.921641791,
178
- "r":0.8666666667,
179
- "f":0.8933092224
180
  },
181
  "root":{
182
- "p":0.9645669291,
183
- "r":0.966469428,
184
- "f":0.9655172414
185
  },
186
  "aux":{
187
- "p":0.9757462687,
188
- "r":0.9712163417,
189
- "f":0.9734760354
190
  },
191
  "advcl":{
192
- "p":0.7333333333,
193
- "r":0.7415730337,
194
- "f":0.7374301676
195
  },
196
  "mark":{
197
- "p":0.964,
198
- "r":0.964,
199
- "f":0.964
200
  },
201
  "fixed":{
202
- "p":0.9663716814,
203
- "r":0.9927272727,
204
- "f":0.9793721973
205
  },
206
  "acl":{
207
- "p":0.8780487805,
208
- "r":0.8703296703,
209
- "f":0.8741721854
210
  },
211
  "obj":{
212
- "p":0.9726443769,
213
- "r":0.9667673716,
214
- "f":0.9696969697
215
  },
216
  "nummod":{
217
- "p":0.9806451613,
218
  "r":0.899408284,
219
- "f":0.9382716049
220
  },
221
  "advmod":{
222
- "p":0.7388059701,
223
- "r":0.7071428571,
224
- "f":0.7226277372
225
  },
226
  "amod":{
227
- "p":0.9333333333,
228
- "r":0.7567567568,
229
- "f":0.8358208955
230
  },
231
  "cop":{
232
- "p":0.9821428571,
233
- "r":0.9593023256,
234
- "f":0.9705882353
235
  },
236
  "ccomp":{
237
- "p":0.9444444444,
238
- "r":0.7727272727,
239
- "f":0.85
240
  },
241
  "det":{
242
  "p":1.0,
@@ -244,76 +244,76 @@
244
  "f":0.9904761905
245
  },
246
  "csubj":{
247
- "p":0.7692307692,
248
- "r":0.8333333333,
249
- "f":0.8
250
  },
251
  "dep":{
252
- "p":0.2857142857,
253
  "r":0.2857142857,
254
- "f":0.2857142857
255
  }
256
  },
257
- "tag_acc":0.9712488769,
258
  "lemma_acc":0.9670526831,
259
- "ents_p":0.8298969072,
260
- "ents_r":0.8100628931,
261
- "ents_f":0.8198599618,
262
  "ents_per_type":{
263
  "DATE":{
264
- "p":0.9906542056,
265
- "r":0.9724770642,
266
- "f":0.9814814815
267
  },
268
  "ORG":{
269
- "p":0.7445255474,
270
  "r":0.7445255474,
271
- "f":0.7445255474
 
 
 
 
 
272
  },
273
  "PERSON":{
274
- "p":0.9516129032,
275
- "r":0.8489208633,
276
- "f":0.897338403
277
  },
278
  "GPE":{
279
- "p":0.79,
280
  "r":0.8404255319,
281
- "f":0.8144329897
282
  },
283
  "PRODUCT":{
284
- "p":0.5945945946,
285
- "r":0.5238095238,
286
- "f":0.5569620253
287
  },
288
  "TIME":{
289
- "p":0.8,
290
  "r":1.0,
291
- "f":0.8888888889
292
  },
293
  "QUANTITY":{
294
- "p":0.8904109589,
295
- "r":0.9848484848,
296
- "f":0.9352517986
297
  },
298
  "NORP":{
299
- "p":0.6785714286,
300
- "r":0.59375,
301
- "f":0.6333333333
302
- },
303
- "TITLE_AFFIX":{
304
- "p":0.7857142857,
305
- "r":0.7333333333,
306
- "f":0.7586206897
307
  },
308
  "ORDINAL":{
309
- "p":0.652173913,
310
- "r":0.6818181818,
311
- "f":0.6666666667
312
  },
313
  "WORK_OF_ART":{
314
- "p":0.8461538462,
315
- "r":0.6470588235,
316
- "f":0.7333333333
317
  },
318
  "CARDINAL":{
319
  "p":1.0,
@@ -321,29 +321,29 @@
321
  "f":0.6666666667
322
  },
323
  "LOC":{
324
- "p":0.6,
325
- "r":0.9,
326
- "f":0.72
327
  },
328
  "PERCENT":{
329
  "p":1.0,
330
- "r":0.7142857143,
331
- "f":0.8333333333
332
  },
333
  "EVENT":{
334
- "p":0.9090909091,
335
- "r":0.7692307692,
336
- "f":0.8333333333
337
  },
338
  "FAC":{
339
- "p":0.7692307692,
340
- "r":0.8108108108,
341
- "f":0.7894736842
342
  },
343
  "MOVEMENT":{
344
- "p":0.3333333333,
345
- "r":0.2,
346
- "f":0.25
347
  },
348
  "LAW":{
349
  "p":0.6666666667,
@@ -361,7 +361,7 @@
361
  "f":1.0
362
  }
363
  },
364
- "speed":3501.8234367587
365
  },
366
  "sources":[
367
  {
@@ -384,7 +384,7 @@
384
  }
385
  ],
386
  "requirements":[
387
- "spacy-transformers>=1.2.0.dev0,<1.3.0",
388
  "sudachipy>=0.5.2,!=0.6.1",
389
  "sudachidict-core>=20211220"
390
  ]
 
1
  {
2
  "lang":"ja",
3
  "name":"core_news_trf",
4
+ "version":"3.6.1",
5
  "description":"Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components: transformer, morphologizer, parser, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 3.0",
10
+ "spacy_version":">=3.6.0,<3.7.0",
11
+ "spacy_git_version":"c067b5264",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
115
  "token_p":0.9764591282,
116
  "token_r":0.9790021974,
117
  "token_f":0.9777290092,
118
+ "pos_acc":0.9798190675,
119
  "morph_acc":0.0,
120
+ "morph_micro_p":0.3401360544,
121
+ "morph_micro_r":0.9803921569,
122
+ "morph_micro_f":0.5050505051,
123
  "morph_per_feat":{
124
  "Polarity":{
125
  "p":1.0,
126
+ "r":0.9803921569,
127
+ "f":0.9900990099
128
  },
129
  "Inflection":{
130
  "p":0.0,
 
137
  "f":0.0
138
  }
139
  },
140
+ "sents_p":0.9519230769,
141
+ "sents_r":0.9763313609,
142
+ "sents_f":0.9639727361,
143
+ "dep_uas":0.9311959654,
144
+ "dep_las":0.9202934425,
145
  "dep_las_per_type":{
146
  "cc":{
147
+ "p":0.8936170213,
148
  "r":0.875,
149
+ "f":0.8842105263
150
  },
151
  "compound":{
152
+ "p":0.9544917258,
153
+ "r":0.9103720406,
154
+ "f":0.9319099827
155
  },
156
  "obl":{
157
+ "p":0.8436724566,
158
+ "r":0.8489388265,
159
+ "f":0.8462974487
160
  },
161
  "case":{
162
+ "p":0.9832317073,
163
+ "r":0.9802431611,
164
+ "f":0.9817351598
165
  },
166
  "dislocated":{
167
+ "p":0.6666666667,
168
+ "r":0.6153846154,
169
+ "f":0.64
170
  },
171
  "nsubj":{
172
+ "p":0.8618677043,
173
+ "r":0.8502879079,
174
+ "f":0.8560386473
175
  },
176
  "nmod":{
177
+ "p":0.9235588972,
178
+ "r":0.8619883041,
179
+ "f":0.8917120387
180
  },
181
  "root":{
182
+ "p":0.9359223301,
183
+ "r":0.9506903353,
184
+ "f":0.9432485323
185
  },
186
  "aux":{
187
+ "p":0.9765698219,
188
+ "r":0.9675023213,
189
+ "f":0.9720149254
190
  },
191
  "advcl":{
192
+ "p":0.7379310345,
193
+ "r":0.7213483146,
194
+ "f":0.7295454545
195
  },
196
  "mark":{
197
+ "p":0.9756592292,
198
+ "r":0.962,
199
+ "f":0.9687814703
200
  },
201
  "fixed":{
202
+ "p":0.9661921708,
203
+ "r":0.9872727273,
204
+ "f":0.976618705
205
  },
206
  "acl":{
207
+ "p":0.8942731278,
208
+ "r":0.8923076923,
209
+ "f":0.8932893289
210
  },
211
  "obj":{
212
+ "p":0.9539877301,
213
+ "r":0.9395770393,
214
+ "f":0.9467275495
215
  },
216
  "nummod":{
217
+ "p":0.987012987,
218
  "r":0.899408284,
219
+ "f":0.9411764706
220
  },
221
  "advmod":{
222
+ "p":0.7537313433,
223
+ "r":0.7214285714,
224
+ "f":0.7372262774
225
  },
226
  "amod":{
227
+ "p":0.9375,
228
+ "r":0.8108108108,
229
+ "f":0.8695652174
230
  },
231
  "cop":{
232
+ "p":0.9764705882,
233
+ "r":0.9651162791,
234
+ "f":0.9707602339
235
  },
236
  "ccomp":{
237
+ "p":0.9047619048,
238
+ "r":0.8636363636,
239
+ "f":0.8837209302
240
  },
241
  "det":{
242
  "p":1.0,
 
244
  "f":0.9904761905
245
  },
246
  "csubj":{
247
+ "p":0.7333333333,
248
+ "r":0.9166666667,
249
+ "f":0.8148148148
250
  },
251
  "dep":{
252
+ "p":0.25,
253
  "r":0.2857142857,
254
+ "f":0.2666666667
255
  }
256
  },
257
+ "tag_acc":0.9713305562,
258
  "lemma_acc":0.9670526831,
259
+ "ents_p":0.8356510746,
260
+ "ents_r":0.8314465409,
261
+ "ents_f":0.8335435057,
262
  "ents_per_type":{
263
  "DATE":{
264
+ "p":0.9727272727,
265
+ "r":0.9816513761,
266
+ "f":0.9771689498
267
  },
268
  "ORG":{
269
+ "p":0.7906976744,
270
  "r":0.7445255474,
271
+ "f":0.7669172932
272
+ },
273
+ "TITLE_AFFIX":{
274
+ "p":0.9230769231,
275
+ "r":0.8,
276
+ "f":0.8571428571
277
  },
278
  "PERSON":{
279
+ "p":0.8865248227,
280
+ "r":0.8992805755,
281
+ "f":0.8928571429
282
  },
283
  "GPE":{
284
+ "p":0.8404255319,
285
  "r":0.8404255319,
286
+ "f":0.8404255319
287
  },
288
  "PRODUCT":{
289
+ "p":0.625,
290
+ "r":0.5952380952,
291
+ "f":0.6097560976
292
  },
293
  "TIME":{
294
+ "p":1.0,
295
  "r":1.0,
296
+ "f":1.0
297
  },
298
  "QUANTITY":{
299
+ "p":0.875,
300
+ "r":0.9545454545,
301
+ "f":0.9130434783
302
  },
303
  "NORP":{
304
+ "p":0.6875,
305
+ "r":0.6875,
306
+ "f":0.6875
 
 
 
 
 
307
  },
308
  "ORDINAL":{
309
+ "p":0.64,
310
+ "r":0.7272727273,
311
+ "f":0.6808510638
312
  },
313
  "WORK_OF_ART":{
314
+ "p":0.8,
315
+ "r":0.7058823529,
316
+ "f":0.75
317
  },
318
  "CARDINAL":{
319
  "p":1.0,
 
321
  "f":0.6666666667
322
  },
323
  "LOC":{
324
+ "p":0.5714285714,
325
+ "r":0.8,
326
+ "f":0.6666666667
327
  },
328
  "PERCENT":{
329
  "p":1.0,
330
+ "r":1.0,
331
+ "f":1.0
332
  },
333
  "EVENT":{
334
+ "p":0.9130434783,
335
+ "r":0.8076923077,
336
+ "f":0.8571428571
337
  },
338
  "FAC":{
339
+ "p":0.7179487179,
340
+ "r":0.7567567568,
341
+ "f":0.7368421053
342
  },
343
  "MOVEMENT":{
344
+ "p":0.6666666667,
345
+ "r":0.4,
346
+ "f":0.5
347
  },
348
  "LAW":{
349
  "p":0.6666666667,
 
361
  "f":1.0
362
  }
363
  },
364
+ "speed":668.4231187225
365
  },
366
  "sources":[
367
  {
 
384
  }
385
  ],
386
  "requirements":[
387
+ "spacy-transformers>=1.2.2,<1.3.0",
388
  "sudachipy>=0.5.2,!=0.6.1",
389
  "sudachidict-core>=20211220"
390
  ]
morphologizer/cfg CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "extend":true,
 
3
  "labels_morph":{
4
  "POS=NOUN":"",
5
  "POS=ADP":"",
 
1
  {
2
  "extend":true,
3
+ "label_smoothing":0.0,
4
  "labels_morph":{
5
  "POS=NOUN":"",
6
  "POS=ADP":"",
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b29b5a466d2b2e04d0ba5ecc814b1c2dd3b68779a268d1c9f2e53acc3ae3e341
3
  size 59084
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3a1049a275d37cece33da1393ca92b132ca87447073c704ebab7bc69d73efa1
3
  size 59084
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8861afdc60dc55a1be8bc7af4d9f886b7df4b01fb10a7edf4db75c1bd4eb4b6d
3
  size 338861
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be17299903d639e7f1bb4379616a9c8f53cd53f758ba9533ea680e799e2eec53
3
  size 338861
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6db32102f6c2c87ecac20d4510cd45b863de1e00a1080b029ceff5926f3fde3
3
  size 318612
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:596b2e4e3b94484870fdb6a818bd3d0e5cd5eb13a25ec17076d9f9595eb1ca54
3
  size 318612
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43a45ee97862b26d1b81b9896d5d5ed3b599d3b6bf80db3c2b03d6bb6e62437a
3
- size 363145845
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5148b11902ffcdbd01171380ba2b6e44769aa5bbbdca877d36d3081dd629ff8
3
+ size 363145763
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5c0c3d498c927b78335dc65ecb0eb22e2dd05617c40665dc66c0b600e8dc6f4
3
- size 1600681
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a71f56abaa60650314209e675a9652a03240e9e7d8fff74f8aaed649519b2d6b
3
+ size 1599987