player1537 committed on
Commit
422f1d4
·
1 Parent(s): b557d4a

Training in progress, step 524

Browse files
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb3c4343d5b79891e68e969b5db2e8b5a3bba2fc92883108865dd3097a7d1357
3
  size 3163457
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb3e39c69cf87ac8f88f27ce6f33ebc40816ea621b5669a014b039c0efc7f541
3
  size 3163457
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb3c4343d5b79891e68e969b5db2e8b5a3bba2fc92883108865dd3097a7d1357
3
  size 3163457
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb3e39c69cf87ac8f88f27ce6f33ebc40816ea621b5669a014b039c0efc7f541
3
  size 3163457
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8901fba30f9688d20aa8e15379a7066e298045a8bb0b9de8851afdbe035d623
3
  size 6319689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d687ffed6510ec1c76cffe4448a4eb5c5312677e63e6ba40479737f7ad1b8a7f
3
  size 6319689
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5063f67e2c88884cab54e05296e5e83ac9a3c954c9e23cfb2d9a21a6c8d8e10
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6227a8020263fdf5f88e2d88cee5778418bbde4b0cf3767c692dc92f26c6f75d
3
  size 14639
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a55327b521b10efdd88cd32140805678860f8977b7eba62e5ac86192f50bb738
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0efecc10e44e390de6dc6bd5194bdbd19c81b879ba1d4cdb7a5e0d951d3f168
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.1501432664756447,
5
- "global_step": 262,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -72,11 +72,71 @@
72
  "learning_rate": 1.702005730659026e-05,
73
  "loss": 2.7529,
74
  "step": 260
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  }
76
  ],
77
  "max_steps": 1745,
78
  "num_train_epochs": 1,
79
- "total_flos": 487908402266112.0,
80
  "trial_name": null,
81
  "trial_params": null
82
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.3002865329512894,
5
+ "global_step": 524,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
72
  "learning_rate": 1.702005730659026e-05,
73
  "loss": 2.7529,
74
  "step": 260
75
+ },
76
+ {
77
+ "epoch": 0.16,
78
+ "learning_rate": 1.6722063037249286e-05,
79
+ "loss": 2.7147,
80
+ "step": 286
81
+ },
82
+ {
83
+ "epoch": 0.18,
84
+ "learning_rate": 1.642406876790831e-05,
85
+ "loss": 2.695,
86
+ "step": 312
87
+ },
88
+ {
89
+ "epoch": 0.19,
90
+ "learning_rate": 1.6137535816618913e-05,
91
+ "loss": 2.7071,
92
+ "step": 338
93
+ },
94
+ {
95
+ "epoch": 0.21,
96
+ "learning_rate": 1.583954154727794e-05,
97
+ "loss": 2.7039,
98
+ "step": 364
99
+ },
100
+ {
101
+ "epoch": 0.22,
102
+ "learning_rate": 1.5541547277936964e-05,
103
+ "loss": 2.7586,
104
+ "step": 390
105
+ },
106
+ {
107
+ "epoch": 0.24,
108
+ "learning_rate": 1.5243553008595991e-05,
109
+ "loss": 2.8132,
110
+ "step": 416
111
+ },
112
+ {
113
+ "epoch": 0.25,
114
+ "learning_rate": 1.495702005730659e-05,
115
+ "loss": 2.7552,
116
+ "step": 442
117
+ },
118
+ {
119
+ "epoch": 0.27,
120
+ "learning_rate": 1.4659025787965618e-05,
121
+ "loss": 2.7388,
122
+ "step": 468
123
+ },
124
+ {
125
+ "epoch": 0.28,
126
+ "learning_rate": 1.4361031518624645e-05,
127
+ "loss": 2.6576,
128
+ "step": 494
129
+ },
130
+ {
131
+ "epoch": 0.3,
132
+ "learning_rate": 1.4063037249283669e-05,
133
+ "loss": 2.6962,
134
+ "step": 520
135
  }
136
  ],
137
  "max_steps": 1745,
138
  "num_train_epochs": 1,
139
+ "total_flos": 975816804532224.0,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
runs/Jul30_21-45-15_04d48b04b124/events.out.tfevents.1690753519.04d48b04b124.12710.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:862ab2bfec1ac04bfcc6c7b6745e05a9197bf0013e1824069f79c8e70bec11ee
3
- size 5915
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08b8b3fba46577efad57cda38fc4207645b4446372c05c26f20f746cc1d5014e
3
+ size 7485