Model save
Browse files
README.md
CHANGED
@@ -46,37 +46,37 @@ The following hyperparameters were used during training:
|
|
46 |
|
47 |
| Training Loss | Epoch | Step | Validation Loss |
|
48 |
|:-------------:|:-----:|:----:|:---------------:|
|
49 |
-
| No log | 1.0 | 1 |
|
50 |
-
| No log | 2.0 | 2 |
|
51 |
-
| No log | 3.0 | 3 |
|
52 |
-
| No log | 4.0 | 4 |
|
53 |
-
| No log | 5.0 | 5 |
|
54 |
-
| No log | 6.0 | 6 |
|
55 |
-
| No log | 7.0 | 7 | 0.
|
56 |
-
| No log | 8.0 | 8 | 0.
|
57 |
-
| No log | 9.0 | 9 | 0.
|
58 |
-
| No log | 10.0 | 10 | 0.
|
59 |
-
| No log | 11.0 | 11 | 0.
|
60 |
-
| No log | 12.0 | 12 | 0.
|
61 |
-
| No log | 13.0 | 13 | 0.
|
62 |
-
| No log | 14.0 | 14 | 0.
|
63 |
| No log | 15.0 | 15 | 0.0002 |
|
64 |
-
| No log | 16.0 | 16 |
|
65 |
-
| No log | 17.0 | 17 |
|
66 |
-
| No log | 18.0 | 18 |
|
67 |
-
| No log | 19.0 | 19 |
|
68 |
-
| No log | 20.0 | 20 |
|
69 |
-
| No log | 21.0 | 21 |
|
70 |
-
| No log | 22.0 | 22 |
|
71 |
-
| No log | 23.0 | 23 | 0.
|
72 |
-
| No log | 24.0 | 24 | 0.
|
73 |
-
| No log | 25.0 | 25 | 0.
|
74 |
-
| No log | 26.0 | 26 | 0.
|
75 |
-
| No log | 27.0 | 27 |
|
76 |
-
| No log | 28.0 | 28 |
|
77 |
-
| No log | 29.0 | 29 | 0.
|
78 |
-
| No log | 30.0 | 30 | 0.
|
79 |
-
| No log | 31.0 | 31 | 0.
|
80 |
| No log | 32.0 | 32 | 0.0001 |
|
81 |
| No log | 33.0 | 33 | 0.0001 |
|
82 |
| No log | 34.0 | 34 | 0.0001 |
|
|
|
46 |
|
47 |
| Training Loss | Epoch | Step | Validation Loss |
|
48 |
|:-------------:|:-----:|:----:|:---------------:|
|
49 |
+
| No log | 1.0 | 1 | 4.8954 |
|
50 |
+
| No log | 2.0 | 2 | 2.6904 |
|
51 |
+
| No log | 3.0 | 3 | 2.2356 |
|
52 |
+
| No log | 4.0 | 4 | 4.8808 |
|
53 |
+
| No log | 5.0 | 5 | 1.5454 |
|
54 |
+
| No log | 6.0 | 6 | 3.2389 |
|
55 |
+
| No log | 7.0 | 7 | 0.6490 |
|
56 |
+
| No log | 8.0 | 8 | 0.0044 |
|
57 |
+
| No log | 9.0 | 9 | 0.0014 |
|
58 |
+
| No log | 10.0 | 10 | 0.0010 |
|
59 |
+
| No log | 11.0 | 11 | 0.0006 |
|
60 |
+
| No log | 12.0 | 12 | 0.0004 |
|
61 |
+
| No log | 13.0 | 13 | 0.0003 |
|
62 |
+
| No log | 14.0 | 14 | 0.0003 |
|
63 |
| No log | 15.0 | 15 | 0.0002 |
|
64 |
+
| No log | 16.0 | 16 | 1.1187 |
|
65 |
+
| No log | 17.0 | 17 | 1.0980 |
|
66 |
+
| No log | 18.0 | 18 | 1.6005 |
|
67 |
+
| No log | 19.0 | 19 | 1.3744 |
|
68 |
+
| No log | 20.0 | 20 | 1.0966 |
|
69 |
+
| No log | 21.0 | 21 | 1.1044 |
|
70 |
+
| No log | 22.0 | 22 | 1.2535 |
|
71 |
+
| No log | 23.0 | 23 | 0.0002 |
|
72 |
+
| No log | 24.0 | 24 | 0.0002 |
|
73 |
+
| No log | 25.0 | 25 | 0.0002 |
|
74 |
+
| No log | 26.0 | 26 | 0.0012 |
|
75 |
+
| No log | 27.0 | 27 | 0.0009 |
|
76 |
+
| No log | 28.0 | 28 | 0.0032 |
|
77 |
+
| No log | 29.0 | 29 | 0.0004 |
|
78 |
+
| No log | 30.0 | 30 | 0.0002 |
|
79 |
+
| No log | 31.0 | 31 | 0.0001 |
|
80 |
| No log | 32.0 | 32 | 0.0001 |
|
81 |
| No log | 33.0 | 33 | 0.0001 |
|
82 |
| No log | 34.0 | 34 | 0.0001 |
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 265470032
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf4302c01aa76f9e4f8c3cd27c917bab2533e30920ad5a345bb2aa15f55e8563
|
3 |
size 265470032
|
runs/Feb17_03-10-41_656f9d99e3cb/events.out.tfevents.1708139449.656f9d99e3cb.417.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97f1c74606c1acbb4c4a69849316d4f0f520074559f1f488a4b16f96e4fdd124
|
3 |
+
size 17911
|
runs/Feb17_03-10-41_656f9d99e3cb/events.out.tfevents.1708139637.656f9d99e3cb.417.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70ad2192e99f60dbf0f3867239584b0429062e7a9bcaa1b5f4a1190de32b6125
|
3 |
+
size 354
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fe50e8a218a38c5df0c7adaead4e9d2aa15ceea6c07c82b3f0648f95f492753
|
3 |
size 4728
|