ZeroUniqueness committed on
Commit
ffa4692
‒
1 Parent(s): ba9b273

Training in progress, step 6800

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-6400 → checkpoint-6700/adapter_model}/README.md +0 -0
  3. {checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-6400/adapter_model → checkpoint-6800}/README.md +0 -0
  6. {checkpoint-6400/adapter_model → checkpoint-6800}/adapter_config.json +0 -0
  7. {checkpoint-6400/adapter_model → checkpoint-6800}/adapter_model.bin +1 -1
  8. {checkpoint-6400 → checkpoint-6800}/optimizer.pt +1 -1
  9. {checkpoint-6400 → checkpoint-6800}/rng_state_0.pth +1 -1
  10. {checkpoint-6400 → checkpoint-6800}/rng_state_1.pth +1 -1
  11. {checkpoint-6400 → checkpoint-6800}/rng_state_10.pth +1 -1
  12. {checkpoint-6400 → checkpoint-6800}/rng_state_11.pth +1 -1
  13. {checkpoint-6400 → checkpoint-6800}/rng_state_12.pth +1 -1
  14. {checkpoint-6400 → checkpoint-6800}/rng_state_13.pth +1 -1
  15. {checkpoint-6400 → checkpoint-6800}/rng_state_2.pth +1 -1
  16. {checkpoint-6400 → checkpoint-6800}/rng_state_3.pth +1 -1
  17. {checkpoint-6400 → checkpoint-6800}/rng_state_4.pth +1 -1
  18. {checkpoint-6400 → checkpoint-6800}/rng_state_5.pth +1 -1
  19. {checkpoint-6400 → checkpoint-6800}/rng_state_6.pth +1 -1
  20. {checkpoint-6400 → checkpoint-6800}/rng_state_7.pth +1 -1
  21. {checkpoint-6400 → checkpoint-6800}/rng_state_8.pth +1 -1
  22. {checkpoint-6400 → checkpoint-6800}/rng_state_9.pth +1 -1
  23. {checkpoint-6400 → checkpoint-6800}/scheduler.pt +1 -1
  24. {checkpoint-6400 → checkpoint-6800}/trainer_state.json +99 -3
  25. {checkpoint-6400 → checkpoint-6800}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcb96297919ffccc23a8f48a581a3185b03d83d73a72799941d2f235cad389d3
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
3
  size 500897101
{checkpoint-6400 → checkpoint-6700/adapter_model}/README.md RENAMED
File without changes
{checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-6400 → checkpoint-6700/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90226543ac07d2ffe305a17c9351436408a800fb2798a5a37995d29cfa11cdec
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb96297919ffccc23a8f48a581a3185b03d83d73a72799941d2f235cad389d3
3
  size 500897101
{checkpoint-6400/adapter_model → checkpoint-6800}/README.md RENAMED
File without changes
{checkpoint-6400/adapter_model → checkpoint-6800}/adapter_config.json RENAMED
File without changes
{checkpoint-6400/adapter_model → checkpoint-6800}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90226543ac07d2ffe305a17c9351436408a800fb2798a5a37995d29cfa11cdec
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caee01e1da9f7e92223499414f8bb25b28ea34daf6fb927c9bd869dcba2559fd
3
  size 500897101
{checkpoint-6400 → checkpoint-6800}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:498cd6646ca27d259b758938350aa23c6521abf4c2e2e7ad5c89c29393ef9c1f
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8797c2a2a21d3c99399832b3c5e9972ada7dec6e83cff5de4273cfa1c8c9f7
3
  size 1001752701
{checkpoint-6400 → checkpoint-6800}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28dca7865869f4b6acc2f12dccd0fb29d6ef17a6e533975d532c1cf6e37e11d2
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76a69b101b534038a0d1cd30c8b1e9841f687d0b3b07df6d02b3916e19b719c2
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e95bbfc662c04f7d23d557ef4f14e26a584a804cd946876565cd79d3d1e5395
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5e8706d00c08c82d30b24671bce72e1fd88ccda2d435bfc8570ef4280b40d47
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a2dbf6e4afff30fb600631c828f6c4c1912077153655c0461e63ffb7c879162
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f82da6b92d2dd42eda022db14fa263f4d03e28910c03bf4e97c967f1d893d8f
3
  size 27789
{checkpoint-6400 → checkpoint-6800}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d5da328b9e2cfadac7217a3b12ebdf223bce01441fbb5a17edda72c92eeff44
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:864477484049b3efdc98311c8185fa709645f956dfcbc5f22f55344bde84d440
3
  size 27789
{checkpoint-6400 → checkpoint-6800}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a6396a02b3c9fddf0f353e31c8917f8cc7ea2204873bd2f4e0c28162e34ae43
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b26c1496ef4023f2612561635f505e587abbdb9e2a946f7d90f08aaa3337aa4
3
  size 27789
{checkpoint-6400 → checkpoint-6800}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26c3b73c9edd077374308e10afe3bc005239a39405fc2b10ee7113b60e422175
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c96078789fb495fd632c506d1671752f888d28d828331ac9ab1506089b50ed
3
  size 27789
{checkpoint-6400 → checkpoint-6800}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08c5ca5a5628b5625b372e5488a7dee8c4f85acbb5354ff6d66f2598a5588c2b
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61e915fcf4dd8f755df46cb9e5050aaae8b843699fa9edd019950564b2fda05c
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21a349f1d80528bfaed715a90e1ab0cc38dcbe474a5753e02758e4de13823c66
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e81ee1af73dd375865e86e8bf7e0efc15b3d4e65d58ca9f4d3ed4d33561879b
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75aa1cbfd6e20ff25a627f7aabdabf69a55c2919dbb6f0133b93d94a03326d25
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9150b049fc2e88708149ace562a8a4c9fef4ae5ea0bb2b8a584401d2abf84b2
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3767f9dbacf7f7a87c95de7127c5a2e9cede78d6705a5058e7c152a0c95be20
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9632ffce62364279230205690bdfad30fc16e17ef6a0f7efacfbeb73e2b1496
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6736745fefc84acda69d21cca4210db1f2401990416ab7e86d4b97098b677a94
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0510fe79de24ae1d1cce464b86e9ee2bc9d2fa77099fb7dc30a7866117bd6e7
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c8fad12f554df98e8ba12231bfa25343972f0990eb9688e02db0ecc021980e7
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c084b8f84126bddadb7fcd64d22191438d565af4562b1fa9ef192f15ed39f43
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:602e5b7b74cd1c25d9273dbce9513df4d9b1b8f459502b8973c5bc8ca815aeb9
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a3c330abb87810692a9b735e5edfdf7a74760562ee2e69753f40e14ef0d2404
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:185367afc7f2b90a34c4a5da4f23b94cb09be4dbc5724516759fc2da4c464581
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:002d98d8a4fb73f32df6d2c88a43fb21668bf0821b126886c8586170e99c43d9
3
  size 27772
{checkpoint-6400 → checkpoint-6800}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12e968b9fe43b01b005367c0524e704d117f3484589d1270b46af1f5c106a7eb
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89396b89609adca20f26c9861c9dcc008dc9de0fbc3e7816552f07bbb0b807a7
3
  size 627
{checkpoint-6400 → checkpoint-6800}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.481582008530438,
5
- "global_step": 6400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1566,11 +1566,107 @@
1566
  "learning_rate": 1.4414188367884907e-05,
1567
  "loss": 0.7668,
1568
  "step": 6400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1569
  }
1570
  ],
1571
  "max_steps": 7737,
1572
  "num_train_epochs": 3,
1573
- "total_flos": 2.7563086736728785e+19,
1574
  "trial_name": null,
1575
  "trial_params": null
1576
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.6366808840635905,
5
+ "global_step": 6800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1566
  "learning_rate": 1.4414188367884907e-05,
1567
  "loss": 0.7668,
1568
  "step": 6400
1569
+ },
1570
+ {
1571
+ "epoch": 2.49,
1572
+ "learning_rate": 1.3892908218015654e-05,
1573
+ "loss": 0.7662,
1574
+ "step": 6425
1575
+ },
1576
+ {
1577
+ "epoch": 2.5,
1578
+ "learning_rate": 1.3380524034274122e-05,
1579
+ "loss": 0.7689,
1580
+ "step": 6450
1581
+ },
1582
+ {
1583
+ "epoch": 2.51,
1584
+ "learning_rate": 1.2877088752513189e-05,
1585
+ "loss": 0.7694,
1586
+ "step": 6475
1587
+ },
1588
+ {
1589
+ "epoch": 2.52,
1590
+ "learning_rate": 1.2382654384049475e-05,
1591
+ "loss": 0.7714,
1592
+ "step": 6500
1593
+ },
1594
+ {
1595
+ "epoch": 2.53,
1596
+ "learning_rate": 1.1897272010289884e-05,
1597
+ "loss": 0.7701,
1598
+ "step": 6525
1599
+ },
1600
+ {
1601
+ "epoch": 2.54,
1602
+ "learning_rate": 1.1420991777454315e-05,
1603
+ "loss": 0.7628,
1604
+ "step": 6550
1605
+ },
1606
+ {
1607
+ "epoch": 2.55,
1608
+ "learning_rate": 1.0953862891394795e-05,
1609
+ "loss": 0.7661,
1610
+ "step": 6575
1611
+ },
1612
+ {
1613
+ "epoch": 2.56,
1614
+ "learning_rate": 1.0495933612511976e-05,
1615
+ "loss": 0.7729,
1616
+ "step": 6600
1617
+ },
1618
+ {
1619
+ "epoch": 2.57,
1620
+ "learning_rate": 1.0047251250769175e-05,
1621
+ "loss": 0.772,
1622
+ "step": 6625
1623
+ },
1624
+ {
1625
+ "epoch": 2.58,
1626
+ "learning_rate": 9.60786216080466e-06,
1627
+ "loss": 0.7702,
1628
+ "step": 6650
1629
+ },
1630
+ {
1631
+ "epoch": 2.59,
1632
+ "learning_rate": 9.177811737142627e-06,
1633
+ "loss": 0.7711,
1634
+ "step": 6675
1635
+ },
1636
+ {
1637
+ "epoch": 2.6,
1638
+ "learning_rate": 8.757144409503359e-06,
1639
+ "loss": 0.765,
1640
+ "step": 6700
1641
+ },
1642
+ {
1643
+ "epoch": 2.61,
1644
+ "learning_rate": 8.34590363821306e-06,
1645
+ "loss": 0.7713,
1646
+ "step": 6725
1647
+ },
1648
+ {
1649
+ "epoch": 2.62,
1650
+ "learning_rate": 7.944131909713859e-06,
1651
+ "loss": 0.7631,
1652
+ "step": 6750
1653
+ },
1654
+ {
1655
+ "epoch": 2.63,
1656
+ "learning_rate": 7.551870732174416e-06,
1657
+ "loss": 0.767,
1658
+ "step": 6775
1659
+ },
1660
+ {
1661
+ "epoch": 2.64,
1662
+ "learning_rate": 7.169160631201566e-06,
1663
+ "loss": 0.7692,
1664
+ "step": 6800
1665
  }
1666
  ],
1667
  "max_steps": 7737,
1668
  "num_train_epochs": 3,
1669
+ "total_flos": 2.928513074136613e+19,
1670
  "trial_name": null,
1671
  "trial_params": null
1672
  }
{checkpoint-6400 → checkpoint-6800}/training_args.bin RENAMED
File without changes