liat-nakayama committed on
Commit
770f862
1 Parent(s): a11f386

Upload 5 files

Browse files
Files changed (5) hide show
  1. config.json +210 -0
  2. config.yaml +59 -0
  3. evaluate.log +0 -0
  4. pytorch_model.bin +3 -0
  5. train.log +0 -0
config.json ADDED
@@ -0,0 +1,210 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_labels": 7,
3
+ "ene_tags": [
4
+ "1.0",
5
+ "1.1",
6
+ "1.10.0",
7
+ "1.10.1",
8
+ "1.11",
9
+ "1.2",
10
+ "1.3.1.0",
11
+ "1.3.1.1",
12
+ "1.3.2",
13
+ "1.4.0",
14
+ "1.4.1",
15
+ "1.4.2",
16
+ "1.4.3",
17
+ "1.4.4.0",
18
+ "1.4.4.1",
19
+ "1.4.5.0",
20
+ "1.4.5.1",
21
+ "1.4.5.2",
22
+ "1.4.5.3",
23
+ "1.4.6.0",
24
+ "1.4.6.1",
25
+ "1.4.6.2",
26
+ "1.4.6.3",
27
+ "1.4.7.0",
28
+ "1.4.7.1",
29
+ "1.4.7.2",
30
+ "1.4.7.3",
31
+ "1.4.7.4",
32
+ "1.5.0",
33
+ "1.5.1.0",
34
+ "1.5.1.1",
35
+ "1.5.1.2",
36
+ "1.5.1.3",
37
+ "1.5.2.0",
38
+ "1.5.2.1",
39
+ "1.5.2.2",
40
+ "1.5.3.0",
41
+ "1.5.3.1",
42
+ "1.5.3.2",
43
+ "1.5.3.3",
44
+ "1.5.3.4",
45
+ "1.5.3.5",
46
+ "1.5.3.6",
47
+ "1.5.3.7",
48
+ "1.5.4.0",
49
+ "1.5.4.1",
50
+ "1.5.4.2",
51
+ "1.5.4.3",
52
+ "1.5.4.4",
53
+ "1.5.4.5",
54
+ "1.5.5.1",
55
+ "1.6.0",
56
+ "1.6.1",
57
+ "1.6.2",
58
+ "1.6.3.0",
59
+ "1.6.3.1",
60
+ "1.6.4.0",
61
+ "1.6.4.1",
62
+ "1.6.4.10",
63
+ "1.6.4.11",
64
+ "1.6.4.12",
65
+ "1.6.4.13",
66
+ "1.6.4.14",
67
+ "1.6.4.15",
68
+ "1.6.4.16",
69
+ "1.6.4.17",
70
+ "1.6.4.18",
71
+ "1.6.4.2",
72
+ "1.6.4.3",
73
+ "1.6.4.4",
74
+ "1.6.4.5",
75
+ "1.6.4.6",
76
+ "1.6.4.7",
77
+ "1.6.4.8",
78
+ "1.6.4.9",
79
+ "1.6.5.0",
80
+ "1.6.5.1",
81
+ "1.6.5.2",
82
+ "1.6.5.3",
83
+ "1.6.5.4",
84
+ "1.6.5.5",
85
+ "1.6.5.6",
86
+ "1.6.6.0",
87
+ "1.6.6.1",
88
+ "1.6.6.2",
89
+ "1.6.6.3",
90
+ "1.6.6.4",
91
+ "1.6.6.5",
92
+ "1.6.6.6",
93
+ "1.7.0",
94
+ "1.7.1",
95
+ "1.7.10",
96
+ "1.7.11",
97
+ "1.7.12",
98
+ "1.7.13.0",
99
+ "1.7.13.1",
100
+ "1.7.13.2",
101
+ "1.7.13.3",
102
+ "1.7.13.4",
103
+ "1.7.13.5",
104
+ "1.7.13.6",
105
+ "1.7.14.0",
106
+ "1.7.14.1",
107
+ "1.7.14.2",
108
+ "1.7.14.3",
109
+ "1.7.15.0",
110
+ "1.7.15.1",
111
+ "1.7.16.0",
112
+ "1.7.16.1",
113
+ "1.7.17.0",
114
+ "1.7.17.1",
115
+ "1.7.18.0",
116
+ "1.7.18.1",
117
+ "1.7.18.2",
118
+ "1.7.18.3",
119
+ "1.7.18.4",
120
+ "1.7.18.5",
121
+ "1.7.18.6",
122
+ "1.7.18.7",
123
+ "1.7.18.8",
124
+ "1.7.19.0",
125
+ "1.7.19.1",
126
+ "1.7.19.10",
127
+ "1.7.19.11",
128
+ "1.7.19.12",
129
+ "1.7.19.13",
130
+ "1.7.19.14",
131
+ "1.7.19.15",
132
+ "1.7.19.16",
133
+ "1.7.19.17",
134
+ "1.7.19.2",
135
+ "1.7.19.3",
136
+ "1.7.19.4",
137
+ "1.7.19.5",
138
+ "1.7.19.6",
139
+ "1.7.19.7",
140
+ "1.7.19.8",
141
+ "1.7.19.9",
142
+ "1.7.2",
143
+ "1.7.20.0",
144
+ "1.7.20.1",
145
+ "1.7.20.2",
146
+ "1.7.21.0",
147
+ "1.7.21.1",
148
+ "1.7.22.0",
149
+ "1.7.22.1",
150
+ "1.7.23.0",
151
+ "1.7.23.1",
152
+ "1.7.24.0",
153
+ "1.7.24.1",
154
+ "1.7.24.2",
155
+ "1.7.24.4",
156
+ "1.7.3",
157
+ "1.7.4",
158
+ "1.7.5",
159
+ "1.7.6",
160
+ "1.7.7",
161
+ "1.7.8",
162
+ "1.7.9",
163
+ "1.8.0",
164
+ "1.8.1",
165
+ "1.8.2.0",
166
+ "1.8.2.1",
167
+ "1.8.2.2",
168
+ "1.8.3.0",
169
+ "1.8.3.1",
170
+ "1.8.3.2",
171
+ "1.8.3.3",
172
+ "1.8.3.4",
173
+ "1.8.3.5",
174
+ "1.8.4.0",
175
+ "1.8.4.1",
176
+ "1.8.4.2",
177
+ "1.8.4.3",
178
+ "1.9.0",
179
+ "1.9.1",
180
+ "1.9.2",
181
+ "1.9.3",
182
+ "1.9.4.0",
183
+ "1.9.4.1",
184
+ "1.9.4.10",
185
+ "1.9.4.11",
186
+ "1.9.4.12",
187
+ "1.9.4.13",
188
+ "1.9.4.2",
189
+ "1.9.4.3",
190
+ "1.9.4.4",
191
+ "1.9.4.5",
192
+ "1.9.4.6",
193
+ "1.9.4.7",
194
+ "1.9.4.8",
195
+ "1.9.4.9",
196
+ "1.9.5.0",
197
+ "1.9.5.1",
198
+ "1.9.5.2"
199
+ ],
200
+ "num_tags": 3,
201
+ "set_labels": {
202
+ "0": "START",
203
+ "1": "END",
204
+ "2": "O",
205
+ "3": "B-NE",
206
+ "4": "I-NE",
207
+ "5": "L-NE",
208
+ "6": "U-NE"
209
+ }
210
+ }
config.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ optim:
2
+ gradient_clip:
3
+ active: active
4
+ clip: 0.01
5
+ cls: AdamW
6
+ param:
7
+ lr: 3.0e-05
8
+ betas:
9
+ - 0.9
10
+ - 0.999
11
+ eps: 1.0e-06
12
+ weight_decay: 0.01
13
+ amsgrad: false
14
+ loss:
15
+ class_weight:
16
+ active: true
17
+ seed: 1234
18
+ device:
19
+ device: cuda
20
+ n_gpu: 8
21
+ model:
22
+ bert:
23
+ name: roberta_base_ja_20190121_m10000_v24000_u500000
24
+ train:
25
+ epoch: 10
26
+ batch_size: 400
27
+ eval:
28
+ batch_size: 800
29
+ data:
30
+ wikipedia:
31
+ debug_size: null
32
+ dir: ./dataset/jawiki-20190121-cirrussearch-content
33
+ add_dir: ./outputs/large_el_base_wikilink_extention/predicts/jawiki-20190121-cirrussearch-content
34
+ filter_no_link: false
35
+ ene:
36
+ path: ./dataset/Shinra2023_Classification_train_20230416.jsonl
37
+ add_path: ./outputs/ene_classifier/jawiki-20190121-cirrussearch-content/predict.jsonl
38
+ encoding: BIOUL
39
+ dev_size: 100
40
+ seq_len: 512
41
+ dup_len: 32
42
+ dataloader:
43
+ num_workers: 8
44
+ setting:
45
+ trainer:
46
+ cls: BaselineTrainer
47
+ type:
48
+ dataset:
49
+ cls: NERCRFDataset
50
+ model:
51
+ cls: NERCRFModel
52
+ crf:
53
+ cls: PatialEERCRF
54
+ partial: true
55
+ add_se_tag: true
56
+ eer:
57
+ ratio: null
58
+ margin: 0.0
59
+ weight: 10
evaluate.log ADDED
File without changes
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:844493c99c469ccd35d4915640f26b95c6ec3ae970d26ac2d4a4cf3a1b3e17b6
3
+ size 420988565
train.log ADDED
The diff for this file is too large to render. See raw diff