leixa committed on
Commit
1c75e2c
1 Parent(s): 9721c5c

Training in progress, step 249, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c03cc5a79be0ba30ad0320be99eba132052fb920252f4f639abfb0267ea350a0
3
  size 191968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec309510b4a87175ef5a1513cca05828a4dc3d8f570cdf3286d715b5d21cb5dd
3
  size 191968
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6554ffe7014b0c305fc27e46e009d8002b5e22780cf3137e2842ed01d2e8fb0
3
  size 253144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bea90bae910a7b8d4bba238e71b511c3801b8731427e6d690d08c3fb8150bc89
3
  size 253144
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b3a05bdcba00a37dc9e6fb656aa0abeeb8eb45eca58cc80e1b27558770bab32
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5df2975a82f3511ba3393fb6029de32864ff15e1fa286047e0cb10e71b975b0e
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fc5b95cc0db21cf56336a583c8dd7fb1d3824838e4cb847d2705abaaeeca402
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e454b41427ceaf5a552ecf234755def1c3b814a84af8caf7693b503fc58c46c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.797583081570997,
5
  "eval_steps": 21,
6
- "global_step": 231,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -642,6 +642,48 @@
642
  "eval_samples_per_second": 538.147,
643
  "eval_steps_per_second": 69.19,
644
  "step": 231
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
645
  }
646
  ],
647
  "logging_steps": 3,
@@ -656,12 +698,12 @@
656
  "should_evaluate": false,
657
  "should_log": false,
658
  "should_save": true,
659
- "should_training_stop": false
660
  },
661
  "attributes": {}
662
  }
663
  },
664
- "total_flos": 25768202600448.0,
665
  "train_batch_size": 8,
666
  "trial_name": null,
667
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0181268882175227,
5
  "eval_steps": 21,
6
+ "global_step": 249,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
642
  "eval_samples_per_second": 538.147,
643
  "eval_steps_per_second": 69.19,
644
  "step": 231
645
+ },
646
+ {
647
+ "epoch": 2.8338368580060425,
648
+ "grad_norm": 0.20488251745700836,
649
+ "learning_rate": 9.687663137678604e-07,
650
+ "loss": 10.175,
651
+ "step": 234
652
+ },
653
+ {
654
+ "epoch": 2.8700906344410875,
655
+ "grad_norm": 0.1691775619983673,
656
+ "learning_rate": 6.207343615165561e-07,
657
+ "loss": 10.1781,
658
+ "step": 237
659
+ },
660
+ {
661
+ "epoch": 2.906344410876133,
662
+ "grad_norm": 0.19150525331497192,
663
+ "learning_rate": 3.494800565275125e-07,
664
+ "loss": 10.184,
665
+ "step": 240
666
+ },
667
+ {
668
+ "epoch": 2.9425981873111784,
669
+ "grad_norm": 0.16350044310092926,
670
+ "learning_rate": 1.554251601833201e-07,
671
+ "loss": 10.1778,
672
+ "step": 243
673
+ },
674
+ {
675
+ "epoch": 2.9788519637462234,
676
+ "grad_norm": 0.16869449615478516,
677
+ "learning_rate": 3.8871399903134265e-08,
678
+ "loss": 10.1763,
679
+ "step": 246
680
+ },
681
+ {
682
+ "epoch": 3.0181268882175227,
683
+ "grad_norm": 0.19018259644508362,
684
+ "learning_rate": 0.0,
685
+ "loss": 12.1418,
686
+ "step": 249
687
  }
688
  ],
689
  "logging_steps": 3,
 
698
  "should_evaluate": false,
699
  "should_log": false,
700
  "should_save": true,
701
+ "should_training_stop": true
702
  },
703
  "attributes": {}
704
  }
705
  },
706
+ "total_flos": 27776114491392.0,
707
  "train_batch_size": 8,
708
  "trial_name": null,
709
  "trial_params": null