therealcyberlord committed on
Commit
6eaaead
1 Parent(s): dc24761

deleted unnecessary files

Browse files
Files changed (5) hide show
  1. optimizer.pt +0 -3
  2. rng_state.pth +0 -3
  3. scheduler.pt +0 -3
  4. trainer_state.json +0 -196
  5. training_args.bin +0 -3
optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a1df273c7f0d4cb5fa35a5a355d9c935806889ac22bb2228aa64c269fec75d9
3
- size 535700065
 
 
 
 
rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0f2f74f7f558ab164dc08759a1603062c3c4de00034a78823223667cabbb076
3
- size 14503
 
 
 
 
scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8d5cd2984885ae326d50c41c5c631bf58ec64cba465012f723e0614d1cf06ec
3
- size 623
 
 
 
 
trainer_state.json DELETED
@@ -1,196 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 0.9891196834817013,
5
- "global_step": 1000,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.1,
12
- "learning_rate": 1e-05,
13
- "loss": 1.012,
14
- "step": 100
15
- },
16
- {
17
- "epoch": 0.1,
18
- "eval_acc": 0.9251113585746102,
19
- "eval_f1 score": 0.9269220320565063,
20
- "eval_loss": 0.1983393132686615,
21
- "eval_precision": 0.8821096173733195,
22
- "eval_recall": 0.976531196336577,
23
- "eval_runtime": 29.7994,
24
- "eval_samples_per_second": 120.54,
25
- "eval_steps_per_second": 3.792,
26
- "step": 100
27
- },
28
- {
29
- "epoch": 0.2,
30
- "learning_rate": 2e-05,
31
- "loss": 0.0588,
32
- "step": 200
33
- },
34
- {
35
- "epoch": 0.2,
36
- "eval_acc": 0.9974944320712695,
37
- "eval_f1 score": 0.9974307736226092,
38
- "eval_loss": 0.008134149946272373,
39
- "eval_precision": 0.994874715261959,
40
- "eval_recall": 1.0,
41
- "eval_runtime": 29.7706,
42
- "eval_samples_per_second": 120.656,
43
- "eval_steps_per_second": 3.796,
44
- "step": 200
45
- },
46
- {
47
- "epoch": 0.3,
48
- "learning_rate": 3e-05,
49
- "loss": 0.0094,
50
- "step": 300
51
- },
52
- {
53
- "epoch": 0.3,
54
- "eval_acc": 0.9991648106904232,
55
- "eval_f1 score": 0.9991421218187019,
56
- "eval_loss": 0.0014619326684623957,
57
- "eval_precision": 0.9982857142857143,
58
- "eval_recall": 1.0,
59
- "eval_runtime": 29.7156,
60
- "eval_samples_per_second": 120.879,
61
- "eval_steps_per_second": 3.803,
62
- "step": 300
63
- },
64
- {
65
- "epoch": 0.4,
66
- "learning_rate": 4e-05,
67
- "loss": 0.003,
68
- "step": 400
69
- },
70
- {
71
- "epoch": 0.4,
72
- "eval_acc": 0.9991648106904232,
73
- "eval_f1 score": 0.9991411394217007,
74
- "eval_loss": 0.0031169140711426735,
75
- "eval_precision": 0.9994272623138603,
76
- "eval_recall": 0.9988551803091014,
77
- "eval_runtime": 29.7394,
78
- "eval_samples_per_second": 120.782,
79
- "eval_steps_per_second": 3.8,
80
- "step": 400
81
- },
82
- {
83
- "epoch": 0.49,
84
- "learning_rate": 5e-05,
85
- "loss": 0.0033,
86
- "step": 500
87
- },
88
- {
89
- "epoch": 0.49,
90
- "eval_acc": 0.998608017817372,
91
- "eval_f1 score": 0.9985710202915119,
92
- "eval_loss": 0.009261890314519405,
93
- "eval_precision": 0.9971461187214612,
94
- "eval_recall": 1.0,
95
- "eval_runtime": 29.7575,
96
- "eval_samples_per_second": 120.709,
97
- "eval_steps_per_second": 3.797,
98
- "step": 500
99
- },
100
- {
101
- "epoch": 0.59,
102
- "learning_rate": 4.021526418786693e-05,
103
- "loss": 0.0059,
104
- "step": 600
105
- },
106
- {
107
- "epoch": 0.59,
108
- "eval_acc": 0.9997216035634744,
109
- "eval_f1 score": 0.9997138769670958,
110
- "eval_loss": 0.002947951899841428,
111
- "eval_precision": 0.9994279176201373,
112
- "eval_recall": 1.0,
113
- "eval_runtime": 29.8118,
114
- "eval_samples_per_second": 120.489,
115
- "eval_steps_per_second": 3.79,
116
- "step": 600
117
- },
118
- {
119
- "epoch": 0.69,
120
- "learning_rate": 3.0430528375733857e-05,
121
- "loss": 0.0025,
122
- "step": 700
123
- },
124
- {
125
- "epoch": 0.69,
126
- "eval_acc": 1.0,
127
- "eval_f1 score": 1.0,
128
- "eval_loss": 0.00011875820928253233,
129
- "eval_precision": 1.0,
130
- "eval_recall": 1.0,
131
- "eval_runtime": 29.727,
132
- "eval_samples_per_second": 120.833,
133
- "eval_steps_per_second": 3.801,
134
- "step": 700
135
- },
136
- {
137
- "epoch": 0.79,
138
- "learning_rate": 2.064579256360078e-05,
139
- "loss": 0.0001,
140
- "step": 800
141
- },
142
- {
143
- "epoch": 0.79,
144
- "eval_acc": 0.9994432071269488,
145
- "eval_f1 score": 0.9994272623138604,
146
- "eval_loss": 0.0010784701444208622,
147
- "eval_precision": 1.0,
148
- "eval_recall": 0.9988551803091014,
149
- "eval_runtime": 29.689,
150
- "eval_samples_per_second": 120.987,
151
- "eval_steps_per_second": 3.806,
152
- "step": 800
153
- },
154
- {
155
- "epoch": 0.89,
156
- "learning_rate": 1.086105675146771e-05,
157
- "loss": 0.0042,
158
- "step": 900
159
- },
160
- {
161
- "epoch": 0.89,
162
- "eval_acc": 1.0,
163
- "eval_f1 score": 1.0,
164
- "eval_loss": 0.00021645698870997876,
165
- "eval_precision": 1.0,
166
- "eval_recall": 1.0,
167
- "eval_runtime": 29.7217,
168
- "eval_samples_per_second": 120.855,
169
- "eval_steps_per_second": 3.802,
170
- "step": 900
171
- },
172
- {
173
- "epoch": 0.99,
174
- "learning_rate": 1.076320939334638e-06,
175
- "loss": 0.0037,
176
- "step": 1000
177
- },
178
- {
179
- "epoch": 0.99,
180
- "eval_acc": 1.0,
181
- "eval_f1 score": 1.0,
182
- "eval_loss": 0.0003033815883100033,
183
- "eval_precision": 1.0,
184
- "eval_recall": 1.0,
185
- "eval_runtime": 29.7302,
186
- "eval_samples_per_second": 120.82,
187
- "eval_steps_per_second": 3.801,
188
- "step": 1000
189
- }
190
- ],
191
- "max_steps": 1011,
192
- "num_train_epochs": 1,
193
- "total_flos": 4238956756992000.0,
194
- "trial_name": null,
195
- "trial_params": null
196
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:13e47fbc29a305256c2ef1fe242107315741a33435bfeded3027f2780b50e58a
3
- size 3247