nttx committed on
Commit
1f341ca
·
verified ·
1 Parent(s): 2f66c7b

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42bdf7a12daee72631644ff26e7c9f80bbf2ff91189adeb79844f41ec3b3a0de
3
  size 138995824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53e52b6d2329dc025f309262138c685c2d456edec0bf62d31a7b72dcedba0776
3
  size 138995824
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dd720e9bd3c6b76823b903b091b8513f63bb3e34dff5623eb6c72cf14934888
3
  size 71078228
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18bed64a2488c7a6d5c52b9cbb86e65f981cc01aeb77c06f9737f6691ab28f75
3
  size 71078228
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:912d3b1d35846784f3679bfe983446d30830056bb9c64fff6ed2d9239f2efee7
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cd2165ee95963f994c4fb0318462352e4521cc9252f74bcb019a89c3a0d1bb4
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2d1d3e656c776bd4cb00d51e16dbc3c67347908a818c2aee478de24ffb13283
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6a1e3232c9dd0558d3b582345b4a537ca2d63d9ae2df7d7189cbdc92c4e384f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.8344256281852722,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-1800",
4
- "epoch": 2.179176755447942,
5
  "eval_steps": 200,
6
- "global_step": 1800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -339,6 +339,42 @@
339
  "eval_samples_per_second": 64.244,
340
  "eval_steps_per_second": 16.061,
341
  "step": 1800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
342
  }
343
  ],
344
  "logging_steps": 50,
@@ -353,7 +389,7 @@
353
  "early_stopping_threshold": 0.0
354
  },
355
  "attributes": {
356
- "early_stopping_patience_counter": 0
357
  }
358
  },
359
  "TrainerControl": {
@@ -362,12 +398,12 @@
362
  "should_evaluate": false,
363
  "should_log": false,
364
  "should_save": true,
365
- "should_training_stop": false
366
  },
367
  "attributes": {}
368
  }
369
  },
370
- "total_flos": 3.446460309307392e+16,
371
  "train_batch_size": 4,
372
  "trial_name": null,
373
  "trial_params": null
 
1
  {
2
  "best_metric": 0.8344256281852722,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-1800",
4
+ "epoch": 2.4213075060532687,
5
  "eval_steps": 200,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
339
  "eval_samples_per_second": 64.244,
340
  "eval_steps_per_second": 16.061,
341
  "step": 1800
342
+ },
343
+ {
344
+ "epoch": 2.2397094430992737,
345
+ "grad_norm": 0.766105592250824,
346
+ "learning_rate": 1.5299867030334814e-06,
347
+ "loss": 0.7791,
348
+ "step": 1850
349
+ },
350
+ {
351
+ "epoch": 2.3002421307506054,
352
+ "grad_norm": 0.9087867140769958,
353
+ "learning_rate": 6.819348298638839e-07,
354
+ "loss": 0.8034,
355
+ "step": 1900
356
+ },
357
+ {
358
+ "epoch": 2.360774818401937,
359
+ "grad_norm": 0.7230655550956726,
360
+ "learning_rate": 1.7077534966650766e-07,
361
+ "loss": 0.8078,
362
+ "step": 1950
363
+ },
364
+ {
365
+ "epoch": 2.4213075060532687,
366
+ "grad_norm": 0.8146218657493591,
367
+ "learning_rate": 0.0,
368
+ "loss": 0.7728,
369
+ "step": 2000
370
+ },
371
+ {
372
+ "epoch": 2.4213075060532687,
373
+ "eval_loss": 0.8369823694229126,
374
+ "eval_runtime": 10.8447,
375
+ "eval_samples_per_second": 64.179,
376
+ "eval_steps_per_second": 16.045,
377
+ "step": 2000
378
  }
379
  ],
380
  "logging_steps": 50,
 
389
  "early_stopping_threshold": 0.0
390
  },
391
  "attributes": {
392
+ "early_stopping_patience_counter": 1
393
  }
394
  },
395
  "TrainerControl": {
 
398
  "should_evaluate": false,
399
  "should_log": false,
400
  "should_save": true,
401
+ "should_training_stop": true
402
  },
403
  "attributes": {}
404
  }
405
  },
406
+ "total_flos": 3.82940034367488e+16,
407
  "train_batch_size": 4,
408
  "trial_name": null,
409
  "trial_params": null