Commit
·
dacd1b1
1
Parent(s):
1b2dcca
Training in progress, step 2700
Browse files
- adapter_model.bin +1 -1
- {checkpoint-2300 → checkpoint-2600/adapter_model}/README.md +0 -0
- {checkpoint-2300 → checkpoint-2600/adapter_model}/adapter_config.json +0 -0
- {checkpoint-2300 → checkpoint-2600/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-2300/adapter_model → checkpoint-2700}/README.md +0 -0
- {checkpoint-2300/adapter_model → checkpoint-2700}/adapter_config.json +0 -0
- {checkpoint-2300/adapter_model → checkpoint-2700}/adapter_model.bin +1 -1
- {checkpoint-2300 → checkpoint-2700}/optimizer.pt +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_0.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_1.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_10.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_11.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_12.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_13.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_2.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_3.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_4.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_5.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_6.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_7.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_8.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/rng_state_9.pth +1 -1
- {checkpoint-2300 → checkpoint-2700}/scheduler.pt +1 -1
- {checkpoint-2300 → checkpoint-2700}/trainer_state.json +99 -3
- {checkpoint-2300 → checkpoint-2700}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72857c4351001ef2bdba0e7acda85bdabe013b254c505a3fec540300b8b69221
|
3 |
size 500897101
|
{checkpoint-2300 → checkpoint-2600/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-2300 → checkpoint-2600/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-2300 → checkpoint-2600/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56dc05e4b75a13b83ba7370f0c76297d690a74a3feda12d5b102e996353b81b9
|
3 |
size 500897101
|
{checkpoint-2300/adapter_model → checkpoint-2700}/README.md
RENAMED
File without changes
|
{checkpoint-2300/adapter_model → checkpoint-2700}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-2300/adapter_model → checkpoint-2700}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72857c4351001ef2bdba0e7acda85bdabe013b254c505a3fec540300b8b69221
|
3 |
size 500897101
|
{checkpoint-2300 → checkpoint-2700}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6581d1b0c10687bb3a3bc5ccd55dd7742012f93950a83aa87e181175ba0dae
|
3 |
size 1001752701
|
{checkpoint-2300 → checkpoint-2700}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f207e68632bac90f957ee4b69848b1b3bf1823589f0084ffda5fe51a062cda66
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22862d05c3516b301c0029fcde0e8d61ec3a7a699c06f10b45b2038d258705bf
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce953efa19f78d1504d60b13e76d782935e5997327dfbb7ccffdc0d67cd8ce63
|
3 |
size 27789
|
{checkpoint-2300 → checkpoint-2700}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1474d4132d013009328b51314e14a4557202e7a03fe1c5dd72c4bee493ebc32
|
3 |
size 27789
|
{checkpoint-2300 → checkpoint-2700}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d397934e98e2af089f95cd3ebfbb6349d0d5379338b81dcdd71225e616b7d2d4
|
3 |
size 27789
|
{checkpoint-2300 → checkpoint-2700}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c5aad35bbee83cb807b5f372f846229966f29c49d44cb351799da3e78c3739b
|
3 |
size 27789
|
{checkpoint-2300 → checkpoint-2700}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54f1ed3e8d7bf0d86bd6d9acac91b9cfaabc266a2ecb5c2e05b800f5fb314129
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01f289536347abba01b49789dfbc3e30589b75cea2b08c3d776318c525f868ad
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:203e94cac471cc2d7046694caa3b10e20010a25498536913b857d68ce1af2d43
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03a357f3ee8bad9901505c5f66d44c603f13d92ab451726200a0ee872b5550ca
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:632d1189cca460782dd94b618a185a39301197e1ac0644b87bc12e7d639eb0db
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c082c3485e7cf0ad8b46608970b89a1aec712ccf501f38bb2fbacfb0063ff84
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f661148a14bf7645d198ffbee78fd27e53207bc2df14b4ac8eaf8cb1ec10b9d2
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:302a97fe98bf1022f079fb5f4731e03dbd6c8c435be26dfdcac5c3191c75b913
|
3 |
size 27772
|
{checkpoint-2300 → checkpoint-2700}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:165954622b82d5ed3c4b0d29e582a52b9368810b632d35b84ef87387e9f95006
|
3 |
size 627
|
{checkpoint-2300 → checkpoint-2700}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -550,11 +550,107 @@
|
|
550 |
"learning_rate": 0.0001596989478162339,
|
551 |
"loss": 0.8334,
|
552 |
"step": 2300
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
553 |
}
|
554 |
],
|
555 |
"max_steps": 7737,
|
556 |
"num_train_epochs": 3,
|
557 |
-
"total_flos":
|
558 |
"trial_name": null,
|
559 |
"trial_params": null
|
560 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.0469174098487786,
|
5 |
+
"global_step": 2700,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
550 |
"learning_rate": 0.0001596989478162339,
|
551 |
"loss": 0.8334,
|
552 |
"step": 2300
|
553 |
+
},
|
554 |
+
{
|
555 |
+
"epoch": 0.9,
|
556 |
+
"learning_rate": 0.00015888044520055106,
|
557 |
+
"loss": 0.8352,
|
558 |
+
"step": 2325
|
559 |
+
},
|
560 |
+
{
|
561 |
+
"epoch": 0.91,
|
562 |
+
"learning_rate": 0.00015805585948026852,
|
563 |
+
"loss": 0.823,
|
564 |
+
"step": 2350
|
565 |
+
},
|
566 |
+
{
|
567 |
+
"epoch": 0.92,
|
568 |
+
"learning_rate": 0.000157225275845659,
|
569 |
+
"loss": 0.8293,
|
570 |
+
"step": 2375
|
571 |
+
},
|
572 |
+
{
|
573 |
+
"epoch": 0.93,
|
574 |
+
"learning_rate": 0.00015638878010665672,
|
575 |
+
"loss": 0.8289,
|
576 |
+
"step": 2400
|
577 |
+
},
|
578 |
+
{
|
579 |
+
"epoch": 0.94,
|
580 |
+
"learning_rate": 0.00015554645868399205,
|
581 |
+
"loss": 0.832,
|
582 |
+
"step": 2425
|
583 |
+
},
|
584 |
+
{
|
585 |
+
"epoch": 0.95,
|
586 |
+
"learning_rate": 0.00015469839860026308,
|
587 |
+
"loss": 0.8294,
|
588 |
+
"step": 2450
|
589 |
+
},
|
590 |
+
{
|
591 |
+
"epoch": 0.96,
|
592 |
+
"learning_rate": 0.0001538446874709452,
|
593 |
+
"loss": 0.8281,
|
594 |
+
"step": 2475
|
595 |
+
},
|
596 |
+
{
|
597 |
+
"epoch": 0.97,
|
598 |
+
"learning_rate": 0.00015298541349533925,
|
599 |
+
"loss": 0.8314,
|
600 |
+
"step": 2500
|
601 |
+
},
|
602 |
+
{
|
603 |
+
"epoch": 0.98,
|
604 |
+
"learning_rate": 0.00015212066544745926,
|
605 |
+
"loss": 0.831,
|
606 |
+
"step": 2525
|
607 |
+
},
|
608 |
+
{
|
609 |
+
"epoch": 0.99,
|
610 |
+
"learning_rate": 0.00015125053266686124,
|
611 |
+
"loss": 0.8319,
|
612 |
+
"step": 2550
|
613 |
+
},
|
614 |
+
{
|
615 |
+
"epoch": 1.0,
|
616 |
+
"learning_rate": 0.00015037510504941303,
|
617 |
+
"loss": 0.8259,
|
618 |
+
"step": 2575
|
619 |
+
},
|
620 |
+
{
|
621 |
+
"epoch": 1.01,
|
622 |
+
"learning_rate": 0.00014949447303800695,
|
623 |
+
"loss": 0.8133,
|
624 |
+
"step": 2600
|
625 |
+
},
|
626 |
+
{
|
627 |
+
"epoch": 1.02,
|
628 |
+
"learning_rate": 0.00014860872761321593,
|
629 |
+
"loss": 0.8139,
|
630 |
+
"step": 2625
|
631 |
+
},
|
632 |
+
{
|
633 |
+
"epoch": 1.03,
|
634 |
+
"learning_rate": 0.00014771796028389405,
|
635 |
+
"loss": 0.804,
|
636 |
+
"step": 2650
|
637 |
+
},
|
638 |
+
{
|
639 |
+
"epoch": 1.04,
|
640 |
+
"learning_rate": 0.0001468222630777225,
|
641 |
+
"loss": 0.8011,
|
642 |
+
"step": 2675
|
643 |
+
},
|
644 |
+
{
|
645 |
+
"epoch": 1.05,
|
646 |
+
"learning_rate": 0.00014592172853170193,
|
647 |
+
"loss": 0.8037,
|
648 |
+
"step": 2700
|
649 |
}
|
650 |
],
|
651 |
"max_steps": 7737,
|
652 |
"num_train_epochs": 3,
|
653 |
+
"total_flos": 1.1628331844604264e+19,
|
654 |
"trial_name": null,
|
655 |
"trial_params": null
|
656 |
}
|
{checkpoint-2300 → checkpoint-2700}/training_args.bin
RENAMED
File without changes
|