Skip to content

Commit 902a5b5

Browse files
committed
Update custom_ner_model29+23-1git including iteration_data.json
1 parent da64d8a commit 902a5b5

File tree

12 files changed

+21973
-0
lines changed

12 files changed

+21973
-0
lines changed
Lines changed: 130 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,130 @@
1+
[paths]
2+
train = null
3+
dev = null
4+
vectors = null
5+
init_tok2vec = null
6+
7+
[system]
8+
seed = 0
9+
gpu_allocator = null
10+
11+
[nlp]
12+
lang = "he"
13+
pipeline = ["ner"]
14+
disabled = []
15+
before_creation = null
16+
after_creation = null
17+
after_pipeline_creation = null
18+
batch_size = 1000
19+
tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20+
vectors = {"@vectors":"spacy.Vectors.v1"}
21+
22+
[components]
23+
24+
[components.ner]
25+
factory = "ner"
26+
incorrect_spans_key = null
27+
moves = null
28+
scorer = {"@scorers":"spacy.ner_scorer.v1"}
29+
update_with_oracle_cut_size = 100
30+
31+
[components.ner.model]
32+
@architectures = "spacy.TransitionBasedParser.v2"
33+
state_type = "ner"
34+
extra_state_tokens = false
35+
hidden_width = 64
36+
maxout_pieces = 2
37+
use_upper = true
38+
nO = null
39+
40+
[components.ner.model.tok2vec]
41+
@architectures = "spacy.HashEmbedCNN.v2"
42+
pretrained_vectors = null
43+
width = 96
44+
depth = 4
45+
embed_size = 2000
46+
window_size = 1
47+
maxout_pieces = 3
48+
subword_features = true
49+
50+
[corpora]
51+
52+
[corpora.dev]
53+
@readers = "spacy.Corpus.v1"
54+
path = ${paths.dev}
55+
gold_preproc = false
56+
max_length = 0
57+
limit = 0
58+
augmenter = null
59+
60+
[corpora.train]
61+
@readers = "spacy.Corpus.v1"
62+
path = ${paths.train}
63+
gold_preproc = false
64+
max_length = 0
65+
limit = 0
66+
augmenter = null
67+
68+
[training]
69+
seed = ${system.seed}
70+
gpu_allocator = ${system.gpu_allocator}
71+
dropout = 0.1
72+
accumulate_gradient = 1
73+
patience = 1600
74+
max_epochs = 0
75+
max_steps = 20000
76+
eval_frequency = 200
77+
frozen_components = []
78+
annotating_components = []
79+
dev_corpus = "corpora.dev"
80+
train_corpus = "corpora.train"
81+
before_to_disk = null
82+
before_update = null
83+
84+
[training.batcher]
85+
@batchers = "spacy.batch_by_words.v1"
86+
discard_oversize = false
87+
tolerance = 0.2
88+
get_length = null
89+
90+
[training.batcher.size]
91+
@schedules = "compounding.v1"
92+
start = 100
93+
stop = 1000
94+
compound = 1.001
95+
t = 0.0
96+
97+
[training.logger]
98+
@loggers = "spacy.ConsoleLogger.v1"
99+
progress_bar = false
100+
101+
[training.optimizer]
102+
@optimizers = "Adam.v1"
103+
beta1 = 0.9
104+
beta2 = 0.999
105+
L2_is_weight_decay = true
106+
L2 = 0.01
107+
grad_clip = 1.0
108+
use_averages = false
109+
eps = 0.00000001
110+
learn_rate = 0.001
111+
112+
[training.score_weights]
113+
ents_f = 1.0
114+
ents_p = 0.0
115+
ents_r = 0.0
116+
ents_per_type = null
117+
118+
[pretraining]
119+
120+
[initialize]
121+
vectors = ${paths.vectors}
122+
init_tok2vec = ${paths.init_tok2vec}
123+
vocab_data = null
124+
lookups = null
125+
before_init = null
126+
after_init = null
127+
128+
[initialize.components]
129+
130+
[initialize.tokenizer]
Lines changed: 122 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,122 @@
1+
{
2+
"0": {
3+
"ner": 4802.388039036398
4+
},
5+
"1": {
6+
"ner": 3438.4395032675866
7+
},
8+
"2": {
9+
"ner": 2827.94393245209
10+
},
11+
"3": {
12+
"ner": 2412.4572408230288
13+
},
14+
"4": {
15+
"ner": 2188.735894150063
16+
},
17+
"5": {
18+
"ner": 1908.96445147932
19+
},
20+
"6": {
21+
"ner": 1894.3397682169134
22+
},
23+
"7": {
24+
"ner": 1702.2257415071354
25+
},
26+
"8": {
27+
"ner": 1615.2015468392465
28+
},
29+
"9": {
30+
"ner": 1567.4141720728862
31+
},
32+
"10": {
33+
"ner": 1428.0969692173633
34+
},
35+
"11": {
36+
"ner": 1412.258335482977
37+
},
38+
"12": {
39+
"ner": 1290.9376119847664
40+
},
41+
"13": {
42+
"ner": 1287.4875631474988
43+
},
44+
"14": {
45+
"ner": 1296.9892050374908
46+
},
47+
"15": {
48+
"ner": 1203.507959512251
49+
},
50+
"16": {
51+
"ner": 1140.983979298868
52+
},
53+
"17": {
54+
"ner": 1194.259869129556
55+
},
56+
"18": {
57+
"ner": 1103.1253703101077
58+
},
59+
"19": {
60+
"ner": 1065.4706941012037
61+
},
62+
"20": {
63+
"ner": 986.9654182265089
64+
},
65+
"21": {
66+
"ner": 980.7948596421411
67+
},
68+
"22": {
69+
"ner": 959.8385475552886
70+
},
71+
"23": {
72+
"ner": 1011.502807016833
73+
},
74+
"24": {
75+
"ner": 952.4556438620727
76+
},
77+
"25": {
78+
"ner": 916.1662904750109
79+
},
80+
"26": {
81+
"ner": 887.7737379491912
82+
},
83+
"27": {
84+
"ner": 890.191895858633
85+
},
86+
"28": {
87+
"ner": 919.5846847199219
88+
},
89+
"29": {
90+
"ner": 817.6113931712281
91+
},
92+
"30": {
93+
"ner": 800.1440236747252
94+
},
95+
"31": {
96+
"ner": 767.2179148542099
97+
},
98+
"32": {
99+
"ner": 807.7469139540956
100+
},
101+
"33": {
102+
"ner": 743.6463610931854
103+
},
104+
"34": {
105+
"ner": 726.275117122479
106+
},
107+
"35": {
108+
"ner": 789.9216052093495
109+
},
110+
"36": {
111+
"ner": 770.8247413277267
112+
},
113+
"37": {
114+
"ner": 753.9640471296772
115+
},
116+
"38": {
117+
"ner": 734.032792442225
118+
},
119+
"39": {
120+
"ner": 775.5143593831364
121+
}
122+
}
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
{
2+
"lang":"he",
3+
"name":"singer_ner_he",
4+
"version":"0.0.0",
5+
"spacy_version":">=3.7.5,<3.8.0",
6+
"description":"Model for recognizing singer names in Hebrew song titles",
7+
"author":"nhlocal",
8+
"email":"[email protected]",
9+
"url":"",
10+
"license":"MIT",
11+
"spacy_git_version":"a6d0fc360",
12+
"vectors":{
13+
"width":0,
14+
"vectors":0,
15+
"keys":0,
16+
"name":null,
17+
"mode":"default"
18+
},
19+
"labels":{
20+
"ner":[
21+
"SINGER"
22+
]
23+
},
24+
"pipeline":[
25+
"ner"
26+
],
27+
"components":[
28+
"ner"
29+
],
30+
"disabled":[
31+
32+
],
33+
"tags":[
34+
"NER",
35+
"Hebrew",
36+
"Singer",
37+
"Named Entity Recognition",
38+
"Text Classification"
39+
]
40+
}
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"moves":null,
3+
"update_with_oracle_cut_size":100,
4+
"multitasks":[
5+
6+
],
7+
"min_action_freq":1,
8+
"learn_tokens":false,
9+
"beam_width":1,
10+
"beam_density":0.0,
11+
"beam_update_prob":0.0,
12+
"incorrect_spans_key":null
13+
}
3.66 MB
Binary file not shown.
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
��moves�`{"0":{},"1":{"SINGER":-1},"2":{"SINGER":-1},"3":{"SINGER":-1},"4":{"":1,"SINGER":-1},"5":{"":1}}�cfg��neg_key�

machine-learn/custom_ner_model29+23-1git/tokenizer

Lines changed: 3 additions & 0 deletions
Large diffs are not rendered by default.
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+

0 commit comments

Comments
 (0)