ZeroUniqueness committed on
Commit
234d4c8
·
1 Parent(s): dacd1b1

Training in progress, step 2800

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-2400 → checkpoint-2700/adapter_model}/README.md +0 -0
  3. {checkpoint-2400 → checkpoint-2700/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-2400 → checkpoint-2700/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-2400/adapter_model → checkpoint-2800}/README.md +0 -0
  6. {checkpoint-2400/adapter_model → checkpoint-2800}/adapter_config.json +0 -0
  7. {checkpoint-2400/adapter_model → checkpoint-2800}/adapter_model.bin +1 -1
  8. {checkpoint-2400 → checkpoint-2800}/optimizer.pt +1 -1
  9. {checkpoint-2400 → checkpoint-2800}/rng_state_0.pth +1 -1
  10. {checkpoint-2400 → checkpoint-2800}/rng_state_1.pth +1 -1
  11. {checkpoint-2400 → checkpoint-2800}/rng_state_10.pth +1 -1
  12. {checkpoint-2400 → checkpoint-2800}/rng_state_11.pth +1 -1
  13. {checkpoint-2400 → checkpoint-2800}/rng_state_12.pth +1 -1
  14. {checkpoint-2400 → checkpoint-2800}/rng_state_13.pth +1 -1
  15. {checkpoint-2400 → checkpoint-2800}/rng_state_2.pth +1 -1
  16. {checkpoint-2400 → checkpoint-2800}/rng_state_3.pth +1 -1
  17. {checkpoint-2400 → checkpoint-2800}/rng_state_4.pth +1 -1
  18. {checkpoint-2400 → checkpoint-2800}/rng_state_5.pth +1 -1
  19. {checkpoint-2400 → checkpoint-2800}/rng_state_6.pth +1 -1
  20. {checkpoint-2400 → checkpoint-2800}/rng_state_7.pth +1 -1
  21. {checkpoint-2400 → checkpoint-2800}/rng_state_8.pth +1 -1
  22. {checkpoint-2400 → checkpoint-2800}/rng_state_9.pth +1 -1
  23. {checkpoint-2400 → checkpoint-2800}/scheduler.pt +1 -1
  24. {checkpoint-2400 → checkpoint-2800}/trainer_state.json +99 -3
  25. {checkpoint-2400 → checkpoint-2800}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72857c4351001ef2bdba0e7acda85bdabe013b254c505a3fec540300b8b69221
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea36cf8e55409a14da3fc648b1dfbd6758083b72318e4742d7d9efc2963c331
3
  size 500897101
{checkpoint-2400 → checkpoint-2700/adapter_model}/README.md RENAMED
File without changes
{checkpoint-2400 → checkpoint-2700/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-2400 → checkpoint-2700/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a78f07f6c25ff3a384ba787025398b099c4ded28cf5a456badfb2abdeac5d61
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72857c4351001ef2bdba0e7acda85bdabe013b254c505a3fec540300b8b69221
3
  size 500897101
{checkpoint-2400/adapter_model → checkpoint-2800}/README.md RENAMED
File without changes
{checkpoint-2400/adapter_model → checkpoint-2800}/adapter_config.json RENAMED
File without changes
{checkpoint-2400/adapter_model → checkpoint-2800}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a78f07f6c25ff3a384ba787025398b099c4ded28cf5a456badfb2abdeac5d61
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea36cf8e55409a14da3fc648b1dfbd6758083b72318e4742d7d9efc2963c331
3
  size 500897101
{checkpoint-2400 → checkpoint-2800}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:442f0fed82ae5467ffbfbea1da70c37dc0aa8f203aa2acc1af02f5551c32b764
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ad547cbbf1779bc43d5f541ea80ff23dfadca360f5b7fbe6b9210bdabd5b0a3
3
  size 1001752701
{checkpoint-2400 → checkpoint-2800}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25acea38e8d5bd8784604757d457a14328f73f9d42017801732c3673ffcbfc19
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54ceaf70d5ffe3e642b177d8e34d1f05742963af64a1bcc361535a9360b397c4
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3505b23dfaf76f0323c2ce25bb39a0407b98df2fa7f7f93ac6e58b365baaf761
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9607a8c2ef03708a5690aea65c1585d4ddbd8e01d7e279a5781ba30e8f1917ff
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96eb3af611e5c6385bb1c8067036789858b5ea043db87fec2ad208b395fffc57
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8681f4b5196d1fde8691794cb783ea1dab72c5077dbcf5394c6998bd4136e731
3
  size 27789
{checkpoint-2400 → checkpoint-2800}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bb10515bb0a74ed81dcf9a34118607a62c4ccb79c19d815ce2d4bdb2d1592d9
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd6cb0b4fef9e193eda245bff5fbcc8df9769fc61966e5f1cdf256150779c1da
3
  size 27789
{checkpoint-2400 → checkpoint-2800}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24fbdd560259eca962bf8c98ba80f05b15bff2710d82866301aa92e4d53e6796
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b66ef66b2b0e1dce0083092ba63e49bdf210999432342b9c2a3993ca381ca353
3
  size 27789
{checkpoint-2400 → checkpoint-2800}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f77df3ee11bff786b83de93e9a70beacac88e03056ae7179237d27b9de8bea35
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cec3ba0fdf94eca1cdf6294a4f5fddb5e3c4f431222a020f6b0acac68bcd0b2
3
  size 27789
{checkpoint-2400 → checkpoint-2800}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:766dffdd000bec26f59585fd09f364b34726c28f571693e392e5ad0bcc023f25
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c53913af6dbe6026773029476e95c35bab12c198a7f90d679010f0fd21198df
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af7057ffcb1d3910adbeb89bdb03cf4db72e06b97d19d39d45a5fe88814dc8fd
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:811ad146e12ad4449d58b59f6fcb92f298ffd443e1a43261d70a55e3eb6343d9
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7b19904fa5333a4aafd38d77ad2ee464c195a29f00b1ba0693aff3710185b33
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5da3f408ca3cd0e89a66524e7f4846e322256ba24237784526bdc51b9ede18b
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d6ca6b609b5c555ef0a17f2d40c5a0ac1a71bb332d258ec785e0a74ff79d3df
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c659f82e6a038ab94307ae424a29fedf3767fe4eabecd42c8ea9b1fb19e36fc
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27777665ad4b9dc253fdd2761e1c9d90b9e208f74c07efc1915794ca03143b09
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d5c97078c0cd3e6af8628033620fd2ade2aea530684443c37b10455b6826ae1
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d32c2e57af55e62f6ebb560ee9f279e7a2d4cf944db5c350acc71b49224172b1
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dd4ff6e318b6e48ea5386ceaf02104c9a56c201311646c4a4e1f4c3be379fe7
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0b4976b266fb6cb141d47782aeb00f44806fb3e77fd565e3b1d784d985b712c
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31d89de68577a860ceffdb664eb8eb7a44e5a8dd6aa62c351c0caf7b931e6a02
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d3562833238738c3d7b0e7d94f70e453b7694fc096cd6651e5e76b9fc45a3ed
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76b3e7281559d95415194847aba99c3c754c2f0ad8f10ac4eb274f044a763cf1
3
  size 27772
{checkpoint-2400 → checkpoint-2800}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f85b645b3956f71e88b844e74e8a1785c175b8f1cad016ae6807e31a99fe657c
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0008ae7bce85f92437f0e149969fba2477d40c35a55a3a590f361670b6eb7290
3
  size 627
{checkpoint-2400 → checkpoint-2800}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9305932531989143,
5
- "global_step": 2400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -574,11 +574,107 @@
574
  "learning_rate": 0.00015638878010665672,
575
  "loss": 0.8289,
576
  "step": 2400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
577
  }
578
  ],
579
  "max_steps": 7737,
580
  "num_train_epochs": 3,
581
- "total_flos": 1.0337240915667583e+19,
582
  "trial_name": null,
583
  "trial_params": null
584
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0856921287320667,
5
+ "global_step": 2800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
574
  "learning_rate": 0.00015638878010665672,
575
  "loss": 0.8289,
576
  "step": 2400
577
+ },
578
+ {
579
+ "epoch": 0.94,
580
+ "learning_rate": 0.00015554645868399205,
581
+ "loss": 0.832,
582
+ "step": 2425
583
+ },
584
+ {
585
+ "epoch": 0.95,
586
+ "learning_rate": 0.00015469839860026308,
587
+ "loss": 0.8294,
588
+ "step": 2450
589
+ },
590
+ {
591
+ "epoch": 0.96,
592
+ "learning_rate": 0.0001538446874709452,
593
+ "loss": 0.8281,
594
+ "step": 2475
595
+ },
596
+ {
597
+ "epoch": 0.97,
598
+ "learning_rate": 0.00015298541349533925,
599
+ "loss": 0.8314,
600
+ "step": 2500
601
+ },
602
+ {
603
+ "epoch": 0.98,
604
+ "learning_rate": 0.00015212066544745926,
605
+ "loss": 0.831,
606
+ "step": 2525
607
+ },
608
+ {
609
+ "epoch": 0.99,
610
+ "learning_rate": 0.00015125053266686124,
611
+ "loss": 0.8319,
612
+ "step": 2550
613
+ },
614
+ {
615
+ "epoch": 1.0,
616
+ "learning_rate": 0.00015037510504941303,
617
+ "loss": 0.8259,
618
+ "step": 2575
619
+ },
620
+ {
621
+ "epoch": 1.01,
622
+ "learning_rate": 0.00014949447303800695,
623
+ "loss": 0.8133,
624
+ "step": 2600
625
+ },
626
+ {
627
+ "epoch": 1.02,
628
+ "learning_rate": 0.00014860872761321593,
629
+ "loss": 0.8139,
630
+ "step": 2625
631
+ },
632
+ {
633
+ "epoch": 1.03,
634
+ "learning_rate": 0.00014771796028389405,
635
+ "loss": 0.804,
636
+ "step": 2650
637
+ },
638
+ {
639
+ "epoch": 1.04,
640
+ "learning_rate": 0.0001468222630777225,
641
+ "loss": 0.8011,
642
+ "step": 2675
643
+ },
644
+ {
645
+ "epoch": 1.05,
646
+ "learning_rate": 0.00014592172853170193,
647
+ "loss": 0.8037,
648
+ "step": 2700
649
+ },
650
+ {
651
+ "epoch": 1.06,
652
+ "learning_rate": 0.00014501644968259212,
653
+ "loss": 0.8063,
654
+ "step": 2725
655
+ },
656
+ {
657
+ "epoch": 1.07,
658
+ "learning_rate": 0.00014410652005730025,
659
+ "loss": 0.8155,
660
+ "step": 2750
661
+ },
662
+ {
663
+ "epoch": 1.08,
664
+ "learning_rate": 0.00014319203366321826,
665
+ "loss": 0.8066,
666
+ "step": 2775
667
+ },
668
+ {
669
+ "epoch": 1.09,
670
+ "learning_rate": 0.0001422730849785107,
671
+ "loss": 0.8091,
672
+ "step": 2800
673
  }
674
  ],
675
  "max_steps": 7737,
676
  "num_train_epochs": 3,
677
+ "total_flos": 1.205858669606155e+19,
678
  "trial_name": null,
679
  "trial_params": null
680
  }
{checkpoint-2400 → checkpoint-2800}/training_args.bin RENAMED
File without changes