Commit
Β·
234d4c8
1
Parent(s):
dacd1b1
Training in progress, step 2800
Browse files- adapter_model.bin +1 -1
- {checkpoint-2400 β checkpoint-2700/adapter_model}/README.md +0 -0
- {checkpoint-2400 β checkpoint-2700/adapter_model}/adapter_config.json +0 -0
- {checkpoint-2400 β checkpoint-2700/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-2400/adapter_model β checkpoint-2800}/README.md +0 -0
- {checkpoint-2400/adapter_model β checkpoint-2800}/adapter_config.json +0 -0
- {checkpoint-2400/adapter_model β checkpoint-2800}/adapter_model.bin +1 -1
- {checkpoint-2400 β checkpoint-2800}/optimizer.pt +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_0.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_1.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_10.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_11.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_12.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_13.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_2.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_3.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_4.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_5.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_6.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_7.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_8.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/rng_state_9.pth +1 -1
- {checkpoint-2400 β checkpoint-2800}/scheduler.pt +1 -1
- {checkpoint-2400 β checkpoint-2800}/trainer_state.json +99 -3
- {checkpoint-2400 β checkpoint-2800}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ea36cf8e55409a14da3fc648b1dfbd6758083b72318e4742d7d9efc2963c331
|
3 |
size 500897101
|
{checkpoint-2400 β checkpoint-2700/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-2400 β checkpoint-2700/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-2400 β checkpoint-2700/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72857c4351001ef2bdba0e7acda85bdabe013b254c505a3fec540300b8b69221
|
3 |
size 500897101
|
{checkpoint-2400/adapter_model β checkpoint-2800}/README.md
RENAMED
File without changes
|
{checkpoint-2400/adapter_model β checkpoint-2800}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-2400/adapter_model β checkpoint-2800}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ea36cf8e55409a14da3fc648b1dfbd6758083b72318e4742d7d9efc2963c331
|
3 |
size 500897101
|
{checkpoint-2400 β checkpoint-2800}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ad547cbbf1779bc43d5f541ea80ff23dfadca360f5b7fbe6b9210bdabd5b0a3
|
3 |
size 1001752701
|
{checkpoint-2400 β checkpoint-2800}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54ceaf70d5ffe3e642b177d8e34d1f05742963af64a1bcc361535a9360b397c4
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9607a8c2ef03708a5690aea65c1585d4ddbd8e01d7e279a5781ba30e8f1917ff
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8681f4b5196d1fde8691794cb783ea1dab72c5077dbcf5394c6998bd4136e731
|
3 |
size 27789
|
{checkpoint-2400 β checkpoint-2800}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd6cb0b4fef9e193eda245bff5fbcc8df9769fc61966e5f1cdf256150779c1da
|
3 |
size 27789
|
{checkpoint-2400 β checkpoint-2800}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b66ef66b2b0e1dce0083092ba63e49bdf210999432342b9c2a3993ca381ca353
|
3 |
size 27789
|
{checkpoint-2400 β checkpoint-2800}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cec3ba0fdf94eca1cdf6294a4f5fddb5e3c4f431222a020f6b0acac68bcd0b2
|
3 |
size 27789
|
{checkpoint-2400 β checkpoint-2800}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c53913af6dbe6026773029476e95c35bab12c198a7f90d679010f0fd21198df
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:811ad146e12ad4449d58b59f6fcb92f298ffd443e1a43261d70a55e3eb6343d9
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5da3f408ca3cd0e89a66524e7f4846e322256ba24237784526bdc51b9ede18b
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c659f82e6a038ab94307ae424a29fedf3767fe4eabecd42c8ea9b1fb19e36fc
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5c97078c0cd3e6af8628033620fd2ade2aea530684443c37b10455b6826ae1
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dd4ff6e318b6e48ea5386ceaf02104c9a56c201311646c4a4e1f4c3be379fe7
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31d89de68577a860ceffdb664eb8eb7a44e5a8dd6aa62c351c0caf7b931e6a02
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76b3e7281559d95415194847aba99c3c754c2f0ad8f10ac4eb274f044a763cf1
|
3 |
size 27772
|
{checkpoint-2400 β checkpoint-2800}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0008ae7bce85f92437f0e149969fba2477d40c35a55a3a590f361670b6eb7290
|
3 |
size 627
|
{checkpoint-2400 β checkpoint-2800}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -574,11 +574,107 @@
|
|
574 |
"learning_rate": 0.00015638878010665672,
|
575 |
"loss": 0.8289,
|
576 |
"step": 2400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
577 |
}
|
578 |
],
|
579 |
"max_steps": 7737,
|
580 |
"num_train_epochs": 3,
|
581 |
-
"total_flos": 1.
|
582 |
"trial_name": null,
|
583 |
"trial_params": null
|
584 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.0856921287320667,
|
5 |
+
"global_step": 2800,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
574 |
"learning_rate": 0.00015638878010665672,
|
575 |
"loss": 0.8289,
|
576 |
"step": 2400
|
577 |
+
},
|
578 |
+
{
|
579 |
+
"epoch": 0.94,
|
580 |
+
"learning_rate": 0.00015554645868399205,
|
581 |
+
"loss": 0.832,
|
582 |
+
"step": 2425
|
583 |
+
},
|
584 |
+
{
|
585 |
+
"epoch": 0.95,
|
586 |
+
"learning_rate": 0.00015469839860026308,
|
587 |
+
"loss": 0.8294,
|
588 |
+
"step": 2450
|
589 |
+
},
|
590 |
+
{
|
591 |
+
"epoch": 0.96,
|
592 |
+
"learning_rate": 0.0001538446874709452,
|
593 |
+
"loss": 0.8281,
|
594 |
+
"step": 2475
|
595 |
+
},
|
596 |
+
{
|
597 |
+
"epoch": 0.97,
|
598 |
+
"learning_rate": 0.00015298541349533925,
|
599 |
+
"loss": 0.8314,
|
600 |
+
"step": 2500
|
601 |
+
},
|
602 |
+
{
|
603 |
+
"epoch": 0.98,
|
604 |
+
"learning_rate": 0.00015212066544745926,
|
605 |
+
"loss": 0.831,
|
606 |
+
"step": 2525
|
607 |
+
},
|
608 |
+
{
|
609 |
+
"epoch": 0.99,
|
610 |
+
"learning_rate": 0.00015125053266686124,
|
611 |
+
"loss": 0.8319,
|
612 |
+
"step": 2550
|
613 |
+
},
|
614 |
+
{
|
615 |
+
"epoch": 1.0,
|
616 |
+
"learning_rate": 0.00015037510504941303,
|
617 |
+
"loss": 0.8259,
|
618 |
+
"step": 2575
|
619 |
+
},
|
620 |
+
{
|
621 |
+
"epoch": 1.01,
|
622 |
+
"learning_rate": 0.00014949447303800695,
|
623 |
+
"loss": 0.8133,
|
624 |
+
"step": 2600
|
625 |
+
},
|
626 |
+
{
|
627 |
+
"epoch": 1.02,
|
628 |
+
"learning_rate": 0.00014860872761321593,
|
629 |
+
"loss": 0.8139,
|
630 |
+
"step": 2625
|
631 |
+
},
|
632 |
+
{
|
633 |
+
"epoch": 1.03,
|
634 |
+
"learning_rate": 0.00014771796028389405,
|
635 |
+
"loss": 0.804,
|
636 |
+
"step": 2650
|
637 |
+
},
|
638 |
+
{
|
639 |
+
"epoch": 1.04,
|
640 |
+
"learning_rate": 0.0001468222630777225,
|
641 |
+
"loss": 0.8011,
|
642 |
+
"step": 2675
|
643 |
+
},
|
644 |
+
{
|
645 |
+
"epoch": 1.05,
|
646 |
+
"learning_rate": 0.00014592172853170193,
|
647 |
+
"loss": 0.8037,
|
648 |
+
"step": 2700
|
649 |
+
},
|
650 |
+
{
|
651 |
+
"epoch": 1.06,
|
652 |
+
"learning_rate": 0.00014501644968259212,
|
653 |
+
"loss": 0.8063,
|
654 |
+
"step": 2725
|
655 |
+
},
|
656 |
+
{
|
657 |
+
"epoch": 1.07,
|
658 |
+
"learning_rate": 0.00014410652005730025,
|
659 |
+
"loss": 0.8155,
|
660 |
+
"step": 2750
|
661 |
+
},
|
662 |
+
{
|
663 |
+
"epoch": 1.08,
|
664 |
+
"learning_rate": 0.00014319203366321826,
|
665 |
+
"loss": 0.8066,
|
666 |
+
"step": 2775
|
667 |
+
},
|
668 |
+
{
|
669 |
+
"epoch": 1.09,
|
670 |
+
"learning_rate": 0.0001422730849785107,
|
671 |
+
"loss": 0.8091,
|
672 |
+
"step": 2800
|
673 |
}
|
674 |
],
|
675 |
"max_steps": 7737,
|
676 |
"num_train_epochs": 3,
|
677 |
+
"total_flos": 1.205858669606155e+19,
|
678 |
"trial_name": null,
|
679 |
"trial_params": null
|
680 |
}
|
{checkpoint-2400 β checkpoint-2800}/training_args.bin
RENAMED
File without changes
|