diff --git a/adapter_config.json b/adapter_config.json index 76a873c20cee3d723689a7add20df73d51f0aa62..f56af3425142720a41fdaf57a5953ffe09e3778c 100644 --- a/adapter_config.json +++ b/adapter_config.json @@ -14,12 +14,12 @@ "r": 32, "revision": null, "target_modules": [ - "k_proj", - "down_proj", - "o_proj", "up_proj", "gate_proj", + "down_proj", "q_proj", + "k_proj", + "o_proj", "v_proj" ], "task_type": "CAUSAL_LM" diff --git a/adapter_model.bin b/adapter_model.bin index 74ff5a581629a7f5ddc9c641d61ce97e81bb3584..4c7f81b52d130b9867f7186c7d23e337252e2a04 100644 --- a/adapter_model.bin +++ b/adapter_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bbb9d05e18d21539814aa33a75bcd59ecfa1423d749f7def1fa099eac295c773 +oid sha256:3febec860772b82c489867736d215315d0909ffc43a3ba7b9fbc1d0b41fd7a20 size 500897101 diff --git a/checkpoint-5700/adapter_model.bin b/checkpoint-5700/adapter_model.bin deleted file mode 100644 index 02526e93c7101a3c9d0727acfe024831696398f1..0000000000000000000000000000000000000000 --- a/checkpoint-5700/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95 -size 500897101 diff --git a/checkpoint-5700/adapter_model/adapter_model.bin b/checkpoint-5700/adapter_model/adapter_model.bin deleted file mode 100644 index 02526e93c7101a3c9d0727acfe024831696398f1..0000000000000000000000000000000000000000 --- a/checkpoint-5700/adapter_model/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6bdd5402d919c62a264000ec96b1dd621956e56ddd66679cf8a429f111552d95 -size 500897101 diff --git a/checkpoint-5700/optimizer.pt b/checkpoint-5700/optimizer.pt deleted file mode 100644 index 8d3c8aee3e9ab00a5c3caededd68fa2b6406534b..0000000000000000000000000000000000000000 --- a/checkpoint-5700/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8847b7875d322ad5570a300587a0f3924a360ae4df3e2feeb97a8a2e21a3cbff -size 1001752701 diff --git a/checkpoint-5700/rng_state_0.pth b/checkpoint-5700/rng_state_0.pth deleted file mode 100644 index 3c2a9137bfd1f9c3efd5228cb92aa36dc82cc29a..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f06ce8fd6a33ec4407e0888bbcc8c7e40f4d820c9b7b7024f808c1cb08bac1f9 -size 27772 diff --git a/checkpoint-5700/rng_state_1.pth b/checkpoint-5700/rng_state_1.pth deleted file mode 100644 index 07bb8ba3171f9114ca378631f850b16a8ca02a83..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:218ef7d643b85f18451d0ff4e11963ac2483f153fb71cc3ca1ab2bc1c0c67051 -size 27772 diff --git a/checkpoint-5700/rng_state_10.pth b/checkpoint-5700/rng_state_10.pth deleted file mode 100644 index 62f27578ae3c5f05071b9cf5c702eeb81bc6d415..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d52fed50c25d75d7fa962b9f10f71f848700ff11f9305a37b16ca126fee5481 -size 27789 diff --git a/checkpoint-5700/rng_state_11.pth b/checkpoint-5700/rng_state_11.pth deleted file mode 100644 index c2efdd8e880e555c19f213e77989c03985c1fd8a..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ca4cdcdc956f43b62d0d18dc1d662748eb79bf6714c90145fc90101a1ea2249d -size 27789 diff --git a/checkpoint-5700/rng_state_12.pth b/checkpoint-5700/rng_state_12.pth deleted file mode 100644 index 35ffc9df08e4edd6abf3d1d242d2d90918445da0..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8305db4caf39e6fd5e1f06f849d2a6d65681cf5c367dd8a754a886f1d32d4456 -size 27789 diff --git a/checkpoint-5700/rng_state_13.pth b/checkpoint-5700/rng_state_13.pth deleted file mode 100644 index 9951d89ea973b30e68cd7319d1009ce908729213..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd9d3dc3cf0abd594c579dd75cbe79170df6d02cec6c38d47e042b3dd26300d9 -size 27789 diff --git a/checkpoint-5700/rng_state_2.pth b/checkpoint-5700/rng_state_2.pth deleted file mode 100644 index 8d36198d13637177c88509187eec27963707dbc4..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:348612a8cf3a488b2de324430f631e10c4e8156112e6c50cecda44157e829595 -size 27772 diff --git a/checkpoint-5700/rng_state_3.pth b/checkpoint-5700/rng_state_3.pth deleted file mode 100644 index 8f72210cf61d845505e06c0f681a11f782d2d543..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c688a5f058c380a72ea06519f8b004106c3bf62f4ac8ae5b0e96c473dbac963c -size 27772 diff --git a/checkpoint-5700/rng_state_4.pth b/checkpoint-5700/rng_state_4.pth deleted file mode 100644 index 062d0bace80c1db35317fbd29fd2698c02cb8cd8..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:20ebd3abf1496a95cb8a1cc494c974137f7880bb1069b7813817b8600444464d -size 27772 diff --git a/checkpoint-5700/rng_state_5.pth b/checkpoint-5700/rng_state_5.pth deleted file mode 100644 index 337c9b58db07231bee27e8d458d57f2f970e7da4..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a0ad3339005efdbfae3bb272ea3ce0907371f54b4834a96fa9c864807063f63d -size 27772 diff --git a/checkpoint-5700/rng_state_6.pth b/checkpoint-5700/rng_state_6.pth deleted file mode 100644 index b6b7bdf4e47fc358d7c2daa8c1e04e4eae152289..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0f13556a5091d1d8f3874fe4a97ac3fc222b586812ceab6167e99bc25dc28fc0 -size 27772 diff --git a/checkpoint-5700/rng_state_7.pth b/checkpoint-5700/rng_state_7.pth deleted file mode 100644 index c2beb3e1bd8f4fe6a018c96e8cc80233ad1384b9..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6b76a223c2ea9e5262b69fc056b9f29e0dd62a728f58a99ac77374aeb72fce68 -size 27772 diff --git a/checkpoint-5700/rng_state_8.pth b/checkpoint-5700/rng_state_8.pth deleted file mode 100644 index 73e55c77fc49eb5929193d73402cd3d20c1f563e..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ae0f14b82c516564368a80f0d993ef826bf389434bdd326ac982efc3e52dc286 -size 27772 diff --git a/checkpoint-5700/rng_state_9.pth b/checkpoint-5700/rng_state_9.pth deleted file mode 100644 index c7da4b43531a42c31650b4c283559a7d8f311a95..0000000000000000000000000000000000000000 --- a/checkpoint-5700/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ff589c2de9aa0e8b005f5e548e65245c51b773411b16d01c505e9d491673af3f -size 27772 diff --git a/checkpoint-5700/scheduler.pt b/checkpoint-5700/scheduler.pt deleted file mode 100644 index 7e36ca6a96764eeccb6aa7d9c5028585fed23370..0000000000000000000000000000000000000000 --- a/checkpoint-5700/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:935f0139e1e2ffb90e75a6a1904fe50b37854f0d00a6d9b7dc07c85fc7a0d97c -size 627 diff --git a/checkpoint-5700/training_args.bin b/checkpoint-5700/training_args.bin deleted file mode 100644 index c456116f688fe6cb6deecb1e0a1cf8d153d349fb..0000000000000000000000000000000000000000 --- a/checkpoint-5700/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2 -size 4027 diff --git a/checkpoint-5800/adapter_model.bin b/checkpoint-5800/adapter_model.bin deleted file mode 100644 index b25d3eaace758c6638b956d27554c51cfd758425..0000000000000000000000000000000000000000 --- a/checkpoint-5800/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c6c8948b163d7faf80bcb4ea3c791311da3d9b14d4257794aeb4a2b35935a025 -size 500897101 diff --git a/checkpoint-5800/adapter_model/adapter_model.bin b/checkpoint-5800/adapter_model/adapter_model.bin deleted file mode 100644 index b25d3eaace758c6638b956d27554c51cfd758425..0000000000000000000000000000000000000000 --- a/checkpoint-5800/adapter_model/adapter_model.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c6c8948b163d7faf80bcb4ea3c791311da3d9b14d4257794aeb4a2b35935a025 -size 500897101 diff --git a/checkpoint-5800/optimizer.pt b/checkpoint-5800/optimizer.pt deleted file mode 100644 index 3ff99dd4e8de03fbb3706e831716b20cdc36b029..0000000000000000000000000000000000000000 --- a/checkpoint-5800/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fdafcf17dcbaf493ce7420b5efc55cc37f121d6d18e479f66229dfb7d3ebfe9a -size 1001752701 diff --git a/checkpoint-5800/rng_state_0.pth b/checkpoint-5800/rng_state_0.pth deleted file mode 100644 index 32576f7fea9a909e430c2379d78ec5bf846b1367..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_0.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fdcc97c3d5ae4ead7b5285c5c5b8dddcbec730d6aced698514214e40163f6c80 -size 27772 diff --git a/checkpoint-5800/rng_state_1.pth b/checkpoint-5800/rng_state_1.pth deleted file mode 100644 index 4427827aec35702513d131a1ce0ecb968ec72c8f..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_1.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8f0dfb5773126adda2e927345797eb8babdfc8aa673a963e413f06bda803f6b8 -size 27772 diff --git a/checkpoint-5800/rng_state_10.pth b/checkpoint-5800/rng_state_10.pth deleted file mode 100644 index d7d02c96cf7f3da06779c0b9becde5f1e0927402..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_10.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:481ee2d6343e3ee249f8f13ba72e97689ec745d34ca3eb731c5977d455e68087 -size 27789 diff --git a/checkpoint-5800/rng_state_11.pth b/checkpoint-5800/rng_state_11.pth deleted file mode 100644 index 02f266ae42f742e7af0f68aa48bb5e1d97f9854a..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_11.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:56d4288a9e908f82added428e5a14ff5dd6e86473ebd372733e241f3c2a4e833 -size 27789 diff --git a/checkpoint-5800/rng_state_12.pth b/checkpoint-5800/rng_state_12.pth deleted file mode 100644 index a5bf2100846d316c907c004cdcf4f53dec78dbc4..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_12.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5749fda2bb629d9c3e4a0bb894676f98047fc123c7ada64e2385c1692f194369 -size 27789 diff --git a/checkpoint-5800/rng_state_13.pth b/checkpoint-5800/rng_state_13.pth deleted file mode 100644 index 6e4c8ec65ba23f1127297f14df1c0e5a815972bc..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_13.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2ac848792be0fda751cfdebaa1419f845e441f823e55d97dc332cb6ebecab888 -size 27789 diff --git a/checkpoint-5800/rng_state_2.pth b/checkpoint-5800/rng_state_2.pth deleted file mode 100644 index 339b13aaf629629acd363207d06b803f3164cc48..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_2.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:004ca3f2557bec1000ed01ad0ac091380c145ff4d9054e495042d9673b164cd3 -size 27772 diff --git a/checkpoint-5800/rng_state_3.pth b/checkpoint-5800/rng_state_3.pth deleted file mode 100644 index fdc8655bc3b73b1d48fe9069eff355b73e1cd4de..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_3.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:83a6e03a2771bdfefb81f6b70a469b27bf46d9bac7c91cec25fbd8fc2e1bb9fd -size 27772 diff --git a/checkpoint-5800/rng_state_4.pth b/checkpoint-5800/rng_state_4.pth deleted file mode 100644 index a33983d78492d1d9d9a320f02bab9fd7437fd447..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_4.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:027cc230cd1577ece8a43abc1ed88fcc51ac874f84b8bcbe865b8338b17825dc -size 27772 diff --git a/checkpoint-5800/rng_state_5.pth b/checkpoint-5800/rng_state_5.pth deleted file mode 100644 index 9c12ce4de318110b659e68db3eb100c4aa128f72..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_5.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e15c6848b49b0375761f21215e2d56ea5a16e27885192cc4af7b1a3f9c325a2 -size 27772 diff --git a/checkpoint-5800/rng_state_6.pth b/checkpoint-5800/rng_state_6.pth deleted file mode 100644 index 2fcdb815d79ea791d2753a0db4b146458c95e3d7..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_6.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0290c211df0a25ca2b739876f096befd7a2f50010f23fcfb700c648fc7c37b88 -size 27772 diff --git a/checkpoint-5800/rng_state_7.pth b/checkpoint-5800/rng_state_7.pth deleted file mode 100644 index c97a750c2dea4a44ea85d28ef92f4d91c42180b9..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_7.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fe7bdf51b5f2867802a2660bdbfa211be18d28a9f5e7325d4957f7ee65895a3a -size 27772 diff --git a/checkpoint-5800/rng_state_8.pth b/checkpoint-5800/rng_state_8.pth deleted file mode 100644 index eb02047c3a256a4e8dc65a9507f137abe27d4048..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_8.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0c7043986c3cfa7014abbd2eb87d4f8ccda04f6a243deda922c9522e5c66f2fd -size 27772 diff --git a/checkpoint-5800/rng_state_9.pth b/checkpoint-5800/rng_state_9.pth deleted file mode 100644 index 45ac65bb884854298d454760ce2735e8ecec7624..0000000000000000000000000000000000000000 --- a/checkpoint-5800/rng_state_9.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a3371033bac6e8e8c6fb2001ca45e33bd941b91fd370cce2d2edc6bac7df0e55 -size 27772 diff --git a/checkpoint-5800/scheduler.pt b/checkpoint-5800/scheduler.pt deleted file mode 100644 index f744f85c5c20ec4e390e284fde44a23de16db37c..0000000000000000000000000000000000000000 --- a/checkpoint-5800/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d7e2a15463250851f8f0353fd93191418e2b4e589eb68be6185d12012957a33f -size 627 diff --git a/checkpoint-5800/training_args.bin b/checkpoint-5800/training_args.bin deleted file mode 100644 index c456116f688fe6cb6deecb1e0a1cf8d153d349fb..0000000000000000000000000000000000000000 --- a/checkpoint-5800/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:df5d13b3f1b9942f80afde79010ef0947feee3df761d245fef1699bc397648b2 -size 4027 diff --git a/checkpoint-5700/README.md b/checkpoint-6000/adapter_model/README.md similarity index 100% rename from checkpoint-5700/README.md rename to checkpoint-6000/adapter_model/README.md diff --git a/checkpoint-5700/adapter_config.json b/checkpoint-6000/adapter_model/adapter_config.json similarity index 94% rename from checkpoint-5700/adapter_config.json rename to checkpoint-6000/adapter_model/adapter_config.json index 7052646debaf453de93d6176727714122c31b64a..76a873c20cee3d723689a7add20df73d51f0aa62 100644 --- a/checkpoint-5700/adapter_config.json +++ b/checkpoint-6000/adapter_model/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "q_proj", - "v_proj", - "gate_proj", - "up_proj", - "o_proj", "k_proj", - "down_proj" + "down_proj", + "o_proj", + "up_proj", + "gate_proj", + "q_proj", + "v_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-6000/adapter_model/adapter_model.bin b/checkpoint-6000/adapter_model/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..74ff5a581629a7f5ddc9c641d61ce97e81bb3584 --- /dev/null +++ b/checkpoint-6000/adapter_model/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb9d05e18d21539814aa33a75bcd59ecfa1423d749f7def1fa099eac295c773 +size 500897101 diff --git a/checkpoint-5700/adapter_model/README.md b/checkpoint-6100/README.md similarity index 100% rename from checkpoint-5700/adapter_model/README.md rename to checkpoint-6100/README.md diff --git a/checkpoint-5800/adapter_config.json b/checkpoint-6100/adapter_config.json similarity index 94% rename from checkpoint-5800/adapter_config.json rename to checkpoint-6100/adapter_config.json index 7052646debaf453de93d6176727714122c31b64a..76a873c20cee3d723689a7add20df73d51f0aa62 100644 --- a/checkpoint-5800/adapter_config.json +++ b/checkpoint-6100/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "q_proj", - "v_proj", - "gate_proj", - "up_proj", - "o_proj", "k_proj", - "down_proj" + "down_proj", + "o_proj", + "up_proj", + "gate_proj", + "q_proj", + "v_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-6100/adapter_model.bin b/checkpoint-6100/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..54820d7d4fcaad389083f94e118ab24d1e4fd5dd --- /dev/null +++ b/checkpoint-6100/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:388cd46150cf53754b4f0d276e98973e5a1f43862ebd435181705f9ab3d56f52 +size 500897101 diff --git a/checkpoint-5800/README.md b/checkpoint-6100/adapter_model/README.md similarity index 100% rename from checkpoint-5800/README.md rename to checkpoint-6100/adapter_model/README.md diff --git a/checkpoint-5700/adapter_model/adapter_config.json b/checkpoint-6100/adapter_model/adapter_config.json similarity index 94% rename from checkpoint-5700/adapter_model/adapter_config.json rename to checkpoint-6100/adapter_model/adapter_config.json index 7052646debaf453de93d6176727714122c31b64a..76a873c20cee3d723689a7add20df73d51f0aa62 100644 --- a/checkpoint-5700/adapter_model/adapter_config.json +++ b/checkpoint-6100/adapter_model/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "q_proj", - "v_proj", - "gate_proj", - "up_proj", - "o_proj", "k_proj", - "down_proj" + "down_proj", + "o_proj", + "up_proj", + "gate_proj", + "q_proj", + "v_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-6100/adapter_model/adapter_model.bin b/checkpoint-6100/adapter_model/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..54820d7d4fcaad389083f94e118ab24d1e4fd5dd --- /dev/null +++ b/checkpoint-6100/adapter_model/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:388cd46150cf53754b4f0d276e98973e5a1f43862ebd435181705f9ab3d56f52 +size 500897101 diff --git a/checkpoint-6100/optimizer.pt b/checkpoint-6100/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..236521f8872ad884c9c3ec00efe6e3c8e33d6d90 --- /dev/null +++ b/checkpoint-6100/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23361198354be9afc19d0f3752c768fddef1e9604ebeb35127628f0a567c9868 +size 1001752701 diff --git a/checkpoint-6100/rng_state_0.pth b/checkpoint-6100/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d4a47f73e949bbef11239229abe7fcf4ec64d17 --- /dev/null +++ b/checkpoint-6100/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9162bd2b64fa6a1399b67a40366d8c08f7d3612b17f83dfde4accf31e0b7e38b +size 27772 diff --git a/checkpoint-6100/rng_state_1.pth b/checkpoint-6100/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7299208cd2a03cc118da47a24ed6840df25aa13 --- /dev/null +++ b/checkpoint-6100/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47eb09798665edeada4b80de705ecf394a69e60f01cd9bd340d95b3c9d0be22e +size 27772 diff --git a/checkpoint-6100/rng_state_10.pth b/checkpoint-6100/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9220a2f64478a35017450dc79c4640366ff2fc9 --- /dev/null +++ b/checkpoint-6100/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c91cade997cd5e5e47ae09b2a295facdfbba964508a100db5e64faf0320f11 +size 27789 diff --git a/checkpoint-6100/rng_state_11.pth b/checkpoint-6100/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..b68e1a6aac1debe7861bc251446a28a7525ecbef --- /dev/null +++ b/checkpoint-6100/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b313ea64d5b302d9894ee7b5dd63f9c9a469ca1256ceab7619cb9f049f70138 +size 27789 diff --git a/checkpoint-6100/rng_state_12.pth b/checkpoint-6100/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..6e935ce8847def46ceac5f99a8e225a9a7d8edb1 --- /dev/null +++ b/checkpoint-6100/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e01b6efa92bd063f4cd80ddd2fa79082d2072f36bc4669abe0ec0742ab75223d +size 27789 diff --git a/checkpoint-6100/rng_state_13.pth b/checkpoint-6100/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..e466e358a4d1098d447607e8d28fb235bbc1bfcc --- /dev/null +++ b/checkpoint-6100/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0222a3e50c0985d9dbe1cad74c8abd56400e0d05ff489b51865ef156928695 +size 27789 diff --git a/checkpoint-6100/rng_state_2.pth b/checkpoint-6100/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e47f0fef4d4d131f7895851af7fdd788203937c4 --- /dev/null +++ b/checkpoint-6100/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13e105d97f9b5820cc4ad076585f2902cd3185bac7443faaead5cb3cef83c80 +size 27772 diff --git a/checkpoint-6100/rng_state_3.pth b/checkpoint-6100/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..51f2ae3113838728a60fbc7f22c20f3cab6b4f82 --- /dev/null +++ b/checkpoint-6100/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf0b2a35e4af585c3a853ac8956e69ab3dc44f8f7b289beeed7bc8889382e11 +size 27772 diff --git a/checkpoint-6100/rng_state_4.pth b/checkpoint-6100/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..96afc0b45a88e997fd3a7e841b786b69c4bc1041 --- /dev/null +++ b/checkpoint-6100/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daedb950d8b297b35aecd0341c5ab143df51662832bddabd61af69a80c0e2691 +size 27772 diff --git a/checkpoint-6100/rng_state_5.pth b/checkpoint-6100/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6a81d31fbb76a480039646aa7a04bf0b2d901ef --- /dev/null +++ b/checkpoint-6100/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:debe892fc62955687dbec8db9a770f303801833773975c37decce994212064ee +size 27772 diff --git a/checkpoint-6100/rng_state_6.pth b/checkpoint-6100/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..c5f8b319c935f095fd9c877560ad24a4cc761a67 --- /dev/null +++ b/checkpoint-6100/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166b098d25e88227361ec50688e81ef3c0a1c1b007617e16be45748918dd52df +size 27772 diff --git a/checkpoint-6100/rng_state_7.pth b/checkpoint-6100/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..c71b1da10579089ed792b24642c1ab457fb054f0 --- /dev/null +++ b/checkpoint-6100/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b699249cf37387b69dcd9425364424949a26a56a95817fe5db02f001d3e9c86f +size 27772 diff --git a/checkpoint-6100/rng_state_8.pth b/checkpoint-6100/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..417bd9a4bc746968759be438fdddb08f0a396961 --- /dev/null +++ b/checkpoint-6100/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba57dff1a1b5008ba90bbde0f66039de21670cc736e37d954752bf67e9cb8130 +size 27772 diff --git a/checkpoint-6100/rng_state_9.pth b/checkpoint-6100/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4a3d29b8f0aa54965ff2c53cb81034bfa4e6f7d --- /dev/null +++ b/checkpoint-6100/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b54c02081eb6d595752be8c21725bd5098ac7be34d0c63c9a1d26e989ac033 +size 27772 diff --git a/checkpoint-6100/scheduler.pt b/checkpoint-6100/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad046903b22f0a5af9f271fa92ec5807c3e3303 --- /dev/null +++ b/checkpoint-6100/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbbf313199bcaa9e78b6da6162b405173b5ef683672f79c9847fdc8ee4406e8 +size 627 diff --git a/checkpoint-5800/trainer_state.json b/checkpoint-6100/trainer_state.json similarity index 94% rename from checkpoint-5800/trainer_state.json rename to checkpoint-6100/trainer_state.json index 253a82686a6ec59beff239685621e7860be41e45..ee7ec88e1dc4f1c446619b342628ee322a1e9870 100644 --- a/checkpoint-5800/trainer_state.json +++ b/checkpoint-6100/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 2.2489336952307095, - "global_step": 5800, + "epoch": 2.365257851880574, + "global_step": 6100, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1414,11 +1414,91 @@ "learning_rate": 2.944041552425475e-05, "loss": 0.7687, "step": 5800 + }, + { + "epoch": 2.26, + "learning_rate": 2.8723813270606982e-05, + "loss": 0.7698, + "step": 5825 + }, + { + "epoch": 2.27, + "learning_rate": 2.8014574760522416e-05, + "loss": 0.7641, + "step": 5850 + }, + { + "epoch": 2.28, + "learning_rate": 2.731277326742876e-05, + "loss": 0.7746, + "step": 5875 + }, + { + "epoch": 2.29, + "learning_rate": 2.6618481296414522e-05, + "loss": 0.7722, + "step": 5900 + }, + { + "epoch": 2.3, + "learning_rate": 2.5931770576738313e-05, + "loss": 0.7698, + "step": 5925 + }, + { + "epoch": 2.31, + "learning_rate": 2.525271205441837e-05, + "loss": 0.7751, + "step": 5950 + }, + { + "epoch": 2.32, + "learning_rate": 2.45813758849028e-05, + "loss": 0.766, + "step": 5975 + }, + { + "epoch": 2.33, + "learning_rate": 2.3917831425821824e-05, + "loss": 0.7673, + "step": 6000 + }, + { + "epoch": 2.33, + "eval_loss": 0.806900680065155, + "eval_runtime": 58.3254, + "eval_samples_per_second": 12.516, + "eval_steps_per_second": 0.909, + "step": 6000 + }, + { + "epoch": 2.34, + "learning_rate": 2.3262147229821984e-05, + "loss": 0.7679, + "step": 6025 + }, + { + "epoch": 2.35, + "learning_rate": 2.2614391037483983e-05, + "loss": 0.7704, + "step": 6050 + }, + { + "epoch": 2.36, + "learning_rate": 2.1974629770324106e-05, + "loss": 0.7661, + "step": 6075 + }, + { + "epoch": 2.37, + "learning_rate": 2.1342929523880416e-05, + "loss": 0.7652, + "step": 6100 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.4980935510562177e+19, + "total_flos": 2.6271635417086296e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-6100/training_args.bin b/checkpoint-6100/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..f228863f67653da2b4fa244186402c05081ec243 --- /dev/null +++ b/checkpoint-6100/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c008d25bfaf7bb9a08aab93c029ae5c61570d5e3604fc9ca9ea2654e60b13cd6 +size 4027 diff --git a/checkpoint-5800/adapter_model/README.md b/checkpoint-6200/README.md similarity index 100% rename from checkpoint-5800/adapter_model/README.md rename to checkpoint-6200/README.md diff --git a/checkpoint-5800/adapter_model/adapter_config.json b/checkpoint-6200/adapter_config.json similarity index 94% rename from checkpoint-5800/adapter_model/adapter_config.json rename to checkpoint-6200/adapter_config.json index 7052646debaf453de93d6176727714122c31b64a..f56af3425142720a41fdaf57a5953ffe09e3778c 100644 --- a/checkpoint-5800/adapter_model/adapter_config.json +++ b/checkpoint-6200/adapter_config.json @@ -14,13 +14,13 @@ "r": 32, "revision": null, "target_modules": [ - "q_proj", - "v_proj", - "gate_proj", "up_proj", - "o_proj", + "gate_proj", + "down_proj", + "q_proj", "k_proj", - "down_proj" + "o_proj", + "v_proj" ], "task_type": "CAUSAL_LM" } \ No newline at end of file diff --git a/checkpoint-6200/adapter_model.bin b/checkpoint-6200/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c7f81b52d130b9867f7186c7d23e337252e2a04 --- /dev/null +++ b/checkpoint-6200/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3febec860772b82c489867736d215315d0909ffc43a3ba7b9fbc1d0b41fd7a20 +size 500897101 diff --git a/checkpoint-6200/optimizer.pt b/checkpoint-6200/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c5a952911823060030eebc914bbca2880c4d30 --- /dev/null +++ b/checkpoint-6200/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c238a192e64d590edb62f130ceed462095ecf868445a5da756e160d8783d7e +size 1001752701 diff --git a/checkpoint-6200/rng_state_0.pth b/checkpoint-6200/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..46febc56bb8128d8b316eef6bc444f5d1a566bc5 --- /dev/null +++ b/checkpoint-6200/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a62682ba7e7cb26595ded7f48ec753d2eb9673721db81b0ec4152ba6856f2d2 +size 27772 diff --git a/checkpoint-6200/rng_state_1.pth b/checkpoint-6200/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..de7b7eef419f455e816fb95b3056a6b509c52e77 --- /dev/null +++ b/checkpoint-6200/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74be203c1e4634b2aa1037ec3a4a9edd5a7298915ce425cf1b9a31f6391efca1 +size 27772 diff --git a/checkpoint-6200/rng_state_10.pth b/checkpoint-6200/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..3a8ccd31e88b62b9d20c1c5817d852c32afd3645 --- /dev/null +++ b/checkpoint-6200/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c037a2c235445f0da915de6619ff6f7f42b2c0c8575b787c1a4ed16e35b61d21 +size 27789 diff --git a/checkpoint-6200/rng_state_11.pth b/checkpoint-6200/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..d77fc6c2f0c47f90b5b0290046e02c351376258b --- /dev/null +++ b/checkpoint-6200/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62b1f601e03a003f84cf80a8c292113d141ee87f5b1ca845fff2a924a30938e +size 27789 diff --git a/checkpoint-6200/rng_state_12.pth b/checkpoint-6200/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..626019e990ca29809e92f3e52cd62e9c8a5cb67e --- /dev/null +++ b/checkpoint-6200/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c758852b4f6179b67806b64c03556a85fc8cb6b2d7fc9b9802e599d92cb5060 +size 27789 diff --git a/checkpoint-6200/rng_state_13.pth b/checkpoint-6200/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..1eb443dad26419c0e52410a49bd3bbe2931d14ed --- /dev/null +++ b/checkpoint-6200/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212ebbd04054c53230c6f37560d76104b53022b0398cb77838fa4b24148235e3 +size 27789 diff --git a/checkpoint-6200/rng_state_2.pth b/checkpoint-6200/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e460449a8986615ebe57738ff550825be4de1ed6 --- /dev/null +++ b/checkpoint-6200/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b20af4a6e33875e1906da2f4f958007730c9409557ca3cdfa5b4dc59f51e2d5 +size 27772 diff --git a/checkpoint-6200/rng_state_3.pth b/checkpoint-6200/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..04e040deb0b3282bc892d025a742ba07f6ac36c3 --- /dev/null +++ b/checkpoint-6200/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f749729546f0e74d9ecf3ad24fea7d29dd1ae76d88741fcdcf02b50df73302c +size 27772 diff --git a/checkpoint-6200/rng_state_4.pth b/checkpoint-6200/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3cb98fa5e465183731934449ef7340668b18e016 --- /dev/null +++ b/checkpoint-6200/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c21e5a49b0e24cc974d1d7d4406b9728cbea5332e18346ba9afb35e0372f526 +size 27772 diff --git a/checkpoint-6200/rng_state_5.pth b/checkpoint-6200/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..95fe339f8a0ef625b72110e4b6cd467c29952a08 --- /dev/null +++ b/checkpoint-6200/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a33c776cc1ad3767cdac6f06b81c8d34fcc1d3ad73a9f8803254d0d817aa09a +size 27772 diff --git a/checkpoint-6200/rng_state_6.pth b/checkpoint-6200/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..37697849b5d9a76a3ef9bc35cb96d57f012fbf19 --- /dev/null +++ b/checkpoint-6200/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64fcf9ef649f08b421dd4acc8e2b02fc8f3ffefc82b05ef17dde8609c9d4bb40 +size 27772 diff --git a/checkpoint-6200/rng_state_7.pth b/checkpoint-6200/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..725cbe48b099bf87fe4d7bf2b61a0140eed7d894 --- /dev/null +++ b/checkpoint-6200/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbea4f476c6f296b74387728b4c7179586b903ae8344e377cc5ce9725f14ba69 +size 27772 diff --git a/checkpoint-6200/rng_state_8.pth b/checkpoint-6200/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5ccf8d0b55f23fbf3d4d378c649300c394cc8c7 --- /dev/null +++ b/checkpoint-6200/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecac165f822fec78a8825820ff7d48e36aa3f53cb41f7a57d2e9dfadf8de351a +size 27772 diff --git a/checkpoint-6200/rng_state_9.pth b/checkpoint-6200/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e1bc5d8e2a1291aefd6d9ae6f44829f57bdd0ee --- /dev/null +++ b/checkpoint-6200/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8091a98c98de998b6ead9067c77d9531ff0bb7b308e548615a3a1c2ec0f7e8 +size 27772 diff --git a/checkpoint-6200/scheduler.pt b/checkpoint-6200/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9334893cfebd90676cd213f0b92097c1990743a --- /dev/null +++ b/checkpoint-6200/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2465347a031d34e4adae1fd19f3f075689a8b84714f2008d365cd61979bafe +size 627 diff --git a/checkpoint-5700/trainer_state.json b/checkpoint-6200/trainer_state.json similarity index 91% rename from checkpoint-5700/trainer_state.json rename to checkpoint-6200/trainer_state.json index 8c4091dad201566e2ffa5b495ce638f306686a5e..5fca4db16c366d43a40bb2c3ed16afec9cdbf5ca 100644 --- a/checkpoint-5700/trainer_state.json +++ b/checkpoint-6200/trainer_state.json @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 2.2101589763474214, - "global_step": 5700, + "epoch": 2.404032570763862, + "global_step": 6200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -1390,11 +1390,139 @@ "learning_rate": 3.237897004017276e-05, "loss": 0.7716, "step": 5700 + }, + { + "epoch": 2.22, + "learning_rate": 3.163366064673427e-05, + "loss": 0.7721, + "step": 5725 + }, + { + "epoch": 2.23, + "learning_rate": 3.089541437233252e-05, + "loss": 0.7658, + "step": 5750 + }, + { + "epoch": 2.24, + "learning_rate": 3.0164307487268996e-05, + "loss": 0.7716, + "step": 5775 + }, + { + "epoch": 2.25, + "learning_rate": 2.944041552425475e-05, + "loss": 0.7687, + "step": 5800 + }, + { + "epoch": 2.26, + "learning_rate": 2.8723813270606982e-05, + "loss": 0.7698, + "step": 5825 + }, + { + "epoch": 2.27, + "learning_rate": 2.8014574760522416e-05, + "loss": 0.7641, + "step": 5850 + }, + { + "epoch": 2.28, + "learning_rate": 2.731277326742876e-05, + "loss": 0.7746, + "step": 5875 + }, + { + "epoch": 2.29, + "learning_rate": 2.6618481296414522e-05, + "loss": 0.7722, + "step": 5900 + }, + { + "epoch": 2.3, + "learning_rate": 2.5931770576738313e-05, + "loss": 0.7698, + "step": 5925 + }, + { + "epoch": 2.31, + "learning_rate": 2.525271205441837e-05, + "loss": 0.7751, + "step": 5950 + }, + { + "epoch": 2.32, + "learning_rate": 2.45813758849028e-05, + "loss": 0.766, + "step": 5975 + }, + { + "epoch": 2.33, + "learning_rate": 2.3917831425821824e-05, + "loss": 0.7673, + "step": 6000 + }, + { + "epoch": 2.33, + "eval_loss": 0.806900680065155, + "eval_runtime": 58.3254, + "eval_samples_per_second": 12.516, + "eval_steps_per_second": 0.909, + "step": 6000 + }, + { + "epoch": 2.34, + "learning_rate": 2.3262147229821984e-05, + "loss": 0.7679, + "step": 6025 + }, + { + "epoch": 2.35, + "learning_rate": 2.2614391037483983e-05, + "loss": 0.7704, + "step": 6050 + }, + { + "epoch": 2.36, + "learning_rate": 2.1974629770324106e-05, + "loss": 0.7661, + "step": 6075 + }, + { + "epoch": 2.37, + "learning_rate": 2.1342929523880416e-05, + "loss": 0.7652, + "step": 6100 + }, + { + "epoch": 2.37, + "learning_rate": 2.0719355560884246e-05, + "loss": 0.765, + "step": 6125 + }, + { + "epoch": 2.38, + "learning_rate": 2.010397230451766e-05, + "loss": 0.7704, + "step": 6150 + }, + { + "epoch": 2.39, + "learning_rate": 1.9496843331757784e-05, + "loss": 0.767, + "step": 6175 + }, + { + "epoch": 2.4, + "learning_rate": 1.8898031366808467e-05, + "loss": 0.7654, + "step": 6200 } ], "max_steps": 7737, "num_train_epochs": 3, - "total_flos": 2.4549667828507083e+19, + "total_flos": 2.6702654094117437e+19, "trial_name": null, "trial_params": null } diff --git a/checkpoint-6200/training_args.bin b/checkpoint-6200/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..dafe3bf543f65213de2af5317e277d3f4db5dc57 --- /dev/null +++ b/checkpoint-6200/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85009bca9623c846e630c294adb80ecbcd9e720da8da9f9ee5311b562908b91 +size 4027 diff --git a/training_args.bin b/training_args.bin index f228863f67653da2b4fa244186402c05081ec243..dafe3bf543f65213de2af5317e277d3f4db5dc57 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c008d25bfaf7bb9a08aab93c029ae5c61570d5e3604fc9ca9ea2654e60b13cd6 +oid sha256:e85009bca9623c846e630c294adb80ecbcd9e720da8da9f9ee5311b562908b91 size 4027