ZeroUniqueness
commited on
Commit
β’
ffa4692
1
Parent(s):
ba9b273
Training in progress, step 6800
Browse files- adapter_model.bin +1 -1
- {checkpoint-6400 β checkpoint-6700/adapter_model}/README.md +0 -0
- {checkpoint-6400 β checkpoint-6700/adapter_model}/adapter_config.json +0 -0
- {checkpoint-6400 β checkpoint-6700/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-6400/adapter_model β checkpoint-6800}/README.md +0 -0
- {checkpoint-6400/adapter_model β checkpoint-6800}/adapter_config.json +0 -0
- {checkpoint-6400/adapter_model β checkpoint-6800}/adapter_model.bin +1 -1
- {checkpoint-6400 β checkpoint-6800}/optimizer.pt +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_0.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_1.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_10.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_11.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_12.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_13.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_2.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_3.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_4.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_5.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_6.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_7.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_8.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/rng_state_9.pth +1 -1
- {checkpoint-6400 β checkpoint-6800}/scheduler.pt +1 -1
- {checkpoint-6400 β checkpoint-6800}/trainer_state.json +99 -3
- {checkpoint-6400 β checkpoint-6800}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
|
3 |
size 500897101
|
{checkpoint-6400 β checkpoint-6700/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-6400 β checkpoint-6700/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6400 β checkpoint-6700/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb96297919ffccc23a8f48a581a3185b03d83d73a72799941d2f235cad389d3
|
3 |
size 500897101
|
{checkpoint-6400/adapter_model β checkpoint-6800}/README.md
RENAMED
File without changes
|
{checkpoint-6400/adapter_model β checkpoint-6800}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6400/adapter_model β checkpoint-6800}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
|
3 |
size 500897101
|
{checkpoint-6400 β checkpoint-6800}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a8797c2a2a21d3c99399832b3c5e9972ada7dec6e83cff5de4273cfa1c8c9f7
|
3 |
size 1001752701
|
{checkpoint-6400 β checkpoint-6800}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76a69b101b534038a0d1cd30c8b1e9841f687d0b3b07df6d02b3916e19b719c2
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5e8706d00c08c82d30b24671bce72e1fd88ccda2d435bfc8570ef4280b40d47
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f82da6b92d2dd42eda022db14fa263f4d03e28910c03bf4e97c967f1d893d8f
|
3 |
size 27789
|
{checkpoint-6400 β checkpoint-6800}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:864477484049b3efdc98311c8185fa709645f956dfcbc5f22f55344bde84d440
|
3 |
size 27789
|
{checkpoint-6400 β checkpoint-6800}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b26c1496ef4023f2612561635f505e587abbdb9e2a946f7d90f08aaa3337aa4
|
3 |
size 27789
|
{checkpoint-6400 β checkpoint-6800}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3c96078789fb495fd632c506d1671752f888d28d828331ac9ab1506089b50ed
|
3 |
size 27789
|
{checkpoint-6400 β checkpoint-6800}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61e915fcf4dd8f755df46cb9e5050aaae8b843699fa9edd019950564b2fda05c
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e81ee1af73dd375865e86e8bf7e0efc15b3d4e65d58ca9f4d3ed4d33561879b
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9150b049fc2e88708149ace562a8a4c9fef4ae5ea0bb2b8a584401d2abf84b2
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9632ffce62364279230205690bdfad30fc16e17ef6a0f7efacfbeb73e2b1496
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0510fe79de24ae1d1cce464b86e9ee2bc9d2fa77099fb7dc30a7866117bd6e7
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c084b8f84126bddadb7fcd64d22191438d565af4562b1fa9ef192f15ed39f43
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a3c330abb87810692a9b735e5edfdf7a74760562ee2e69753f40e14ef0d2404
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:002d98d8a4fb73f32df6d2c88a43fb21668bf0821b126886c8586170e99c43d9
|
3 |
size 27772
|
{checkpoint-6400 β checkpoint-6800}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89396b89609adca20f26c9861c9dcc008dc9de0fbc3e7816552f07bbb0b807a7
|
3 |
size 627
|
{checkpoint-6400 β checkpoint-6800}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1566,11 +1566,107 @@
|
|
1566 |
"learning_rate": 1.4414188367884907e-05,
|
1567 |
"loss": 0.7668,
|
1568 |
"step": 6400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1569 |
}
|
1570 |
],
|
1571 |
"max_steps": 7737,
|
1572 |
"num_train_epochs": 3,
|
1573 |
-
"total_flos": 2.
|
1574 |
"trial_name": null,
|
1575 |
"trial_params": null
|
1576 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.6366808840635905,
|
5 |
+
"global_step": 6800,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1566 |
"learning_rate": 1.4414188367884907e-05,
|
1567 |
"loss": 0.7668,
|
1568 |
"step": 6400
|
1569 |
+
},
|
1570 |
+
{
|
1571 |
+
"epoch": 2.49,
|
1572 |
+
"learning_rate": 1.3892908218015654e-05,
|
1573 |
+
"loss": 0.7662,
|
1574 |
+
"step": 6425
|
1575 |
+
},
|
1576 |
+
{
|
1577 |
+
"epoch": 2.5,
|
1578 |
+
"learning_rate": 1.3380524034274122e-05,
|
1579 |
+
"loss": 0.7689,
|
1580 |
+
"step": 6450
|
1581 |
+
},
|
1582 |
+
{
|
1583 |
+
"epoch": 2.51,
|
1584 |
+
"learning_rate": 1.2877088752513189e-05,
|
1585 |
+
"loss": 0.7694,
|
1586 |
+
"step": 6475
|
1587 |
+
},
|
1588 |
+
{
|
1589 |
+
"epoch": 2.52,
|
1590 |
+
"learning_rate": 1.2382654384049475e-05,
|
1591 |
+
"loss": 0.7714,
|
1592 |
+
"step": 6500
|
1593 |
+
},
|
1594 |
+
{
|
1595 |
+
"epoch": 2.53,
|
1596 |
+
"learning_rate": 1.1897272010289884e-05,
|
1597 |
+
"loss": 0.7701,
|
1598 |
+
"step": 6525
|
1599 |
+
},
|
1600 |
+
{
|
1601 |
+
"epoch": 2.54,
|
1602 |
+
"learning_rate": 1.1420991777454315e-05,
|
1603 |
+
"loss": 0.7628,
|
1604 |
+
"step": 6550
|
1605 |
+
},
|
1606 |
+
{
|
1607 |
+
"epoch": 2.55,
|
1608 |
+
"learning_rate": 1.0953862891394795e-05,
|
1609 |
+
"loss": 0.7661,
|
1610 |
+
"step": 6575
|
1611 |
+
},
|
1612 |
+
{
|
1613 |
+
"epoch": 2.56,
|
1614 |
+
"learning_rate": 1.0495933612511976e-05,
|
1615 |
+
"loss": 0.7729,
|
1616 |
+
"step": 6600
|
1617 |
+
},
|
1618 |
+
{
|
1619 |
+
"epoch": 2.57,
|
1620 |
+
"learning_rate": 1.0047251250769175e-05,
|
1621 |
+
"loss": 0.772,
|
1622 |
+
"step": 6625
|
1623 |
+
},
|
1624 |
+
{
|
1625 |
+
"epoch": 2.58,
|
1626 |
+
"learning_rate": 9.60786216080466e-06,
|
1627 |
+
"loss": 0.7702,
|
1628 |
+
"step": 6650
|
1629 |
+
},
|
1630 |
+
{
|
1631 |
+
"epoch": 2.59,
|
1632 |
+
"learning_rate": 9.177811737142627e-06,
|
1633 |
+
"loss": 0.7711,
|
1634 |
+
"step": 6675
|
1635 |
+
},
|
1636 |
+
{
|
1637 |
+
"epoch": 2.6,
|
1638 |
+
"learning_rate": 8.757144409503359e-06,
|
1639 |
+
"loss": 0.765,
|
1640 |
+
"step": 6700
|
1641 |
+
},
|
1642 |
+
{
|
1643 |
+
"epoch": 2.61,
|
1644 |
+
"learning_rate": 8.34590363821306e-06,
|
1645 |
+
"loss": 0.7713,
|
1646 |
+
"step": 6725
|
1647 |
+
},
|
1648 |
+
{
|
1649 |
+
"epoch": 2.62,
|
1650 |
+
"learning_rate": 7.944131909713859e-06,
|
1651 |
+
"loss": 0.7631,
|
1652 |
+
"step": 6750
|
1653 |
+
},
|
1654 |
+
{
|
1655 |
+
"epoch": 2.63,
|
1656 |
+
"learning_rate": 7.551870732174416e-06,
|
1657 |
+
"loss": 0.767,
|
1658 |
+
"step": 6775
|
1659 |
+
},
|
1660 |
+
{
|
1661 |
+
"epoch": 2.64,
|
1662 |
+
"learning_rate": 7.169160631201566e-06,
|
1663 |
+
"loss": 0.7692,
|
1664 |
+
"step": 6800
|
1665 |
}
|
1666 |
],
|
1667 |
"max_steps": 7737,
|
1668 |
"num_train_epochs": 3,
|
1669 |
+
"total_flos": 2.928513074136613e+19,
|
1670 |
"trial_name": null,
|
1671 |
"trial_params": null
|
1672 |
}
|
{checkpoint-6400 β checkpoint-6800}/training_args.bin
RENAMED
File without changes
|