goendalf666
/

falcon-7b-sql-instruction-lora

Model card Files Files and versions Community

tom813 committed on Jul 2, 2023

Commit

1c480f3

•

1 Parent(s): ed9b1f1

one table update 6000

Browse files

Files changed (7) hide show

adapter_model.bin +1 -1
optimizer.pt +1 -1
rng_state.pth +1 -1
scheduler.pt +1 -1
tokenizer.json +14 -2
trainer_state.json +8 -56
training_args.bin +1 -1

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40e6069a78f8988dfcbd9ce8f46655ca2c28ead825b4d88fdb576649f6ba0e23
 size 261189898

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed411523e825514d3a68061cdafdc3807eb42d802ff4f39fa2958d1ae57fe545
 size 261189898

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5b37a23fdc89c1c57154a5bbb2b82bcdfebeae7b1f32913e8f5838b4365d5b94
 size 1044540346

 version https://git-lfs.github.com/spec/v1
+oid sha256:96599b7ccdf5b3a524ac5736c85b602d224dd22026f48a1002f23017f67c0b9f
 size 1044540346

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df5abd41fec659ebbe7dd2b4caff7408e32c39ef09f30071b012af22a9ef7d04
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:53de026ea02239c8920d0a8191312db2f91442b4779f916d3bb9e22f1bcba98b
 size 14244

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ac7de8907e79c9f47fccf3aa89da8ca3d3d851fdb56e005195640f80ea9c8917
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:0bd3d777aeaba0b41d9a03c6730b70ea7cfcb24e68ae7498f71468201e53ab38
 size 1064

tokenizer.json CHANGED Viewed

@@ -1,7 +1,19 @@
 {
   "version": "1.0",
-  "truncation": null,
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 256,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": "BatchLongest",
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 11,
+    "pad_type_id": 0,
+    "pad_token": "<|endoftext|>"
+  },
   "added_tokens": [
     {
       "id": 0,

trainer_state.json CHANGED Viewed

@@ -1,76 +1,28 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 9.176416609314062,
-  "global_step": 30000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.92,
       "learning_rate": 0.0002,
-      "loss": 0.4138,
       "step": 3000
     },
     {
-      "epoch": 1.84,
       "learning_rate": 0.0002,
-      "loss": 0.298,
       "step": 6000
-    },
-    {
-      "epoch": 2.75,
-      "learning_rate": 0.0002,
-      "loss": 0.2786,
-      "step": 9000
-    },
-    {
-      "epoch": 3.67,
-      "learning_rate": 0.0002,
-      "loss": 0.263,
-      "step": 12000
-    },
-    {
-      "epoch": 4.59,
-      "learning_rate": 0.0002,
-      "loss": 0.2507,
-      "step": 15000
-    },
-    {
-      "epoch": 5.51,
-      "learning_rate": 0.0002,
-      "loss": 0.2387,
-      "step": 18000
-    },
-    {
-      "epoch": 6.42,
-      "learning_rate": 0.0002,
-      "loss": 0.2279,
-      "step": 21000
-    },
-    {
-      "epoch": 7.34,
-      "learning_rate": 0.0002,
-      "loss": 0.2179,
-      "step": 24000
-    },
-    {
-      "epoch": 8.26,
-      "learning_rate": 0.0002,
-      "loss": 0.209,
-      "step": 27000
-    },
-    {
-      "epoch": 9.18,
-      "learning_rate": 0.0002,
-      "loss": 0.2015,
-      "step": 30000
     }
   ],
   "max_steps": 30000,
-  "num_train_epochs": 10,
-  "total_flos": 2.5389193589849457e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.853658536585366,
+  "global_step": 6000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 2.93,
       "learning_rate": 0.0002,
+      "loss": 0.3963,
       "step": 3000
     },
     {
+      "epoch": 5.85,
       "learning_rate": 0.0002,
+      "loss": 0.2937,
       "step": 6000
     }
   ],
   "max_steps": 30000,
+  "num_train_epochs": 30,
+  "total_flos": 1.26953109061632e+18,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5569544233e3061e5e000ebbd0e69d9723778ac08056e5ec170696f4d0e2b11
 size 4408

 version https://git-lfs.github.com/spec/v1
+oid sha256:a1401c5ed0ace9fbb251f5d8a19a6ffcb1a44136d06be0bdc387ea4e700c4ba5
 size 4408