Model save
Browse files- README.md +1 -1
- all_results.json +4 -4
- eval_results.json +4 -4
- trainer_state.json +8 -0
README.md
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
---
|
2 |
base_model: meta-llama/Llama-3.2-1B
|
3 |
library_name: transformers
|
4 |
-
model_name:
|
5 |
tags:
|
6 |
- generated_from_trainer
|
7 |
- trl
|
|
|
1 |
---
|
2 |
base_model: meta-llama/Llama-3.2-1B
|
3 |
library_name: transformers
|
4 |
+
model_name: results
|
5 |
tags:
|
6 |
- generated_from_trainer
|
7 |
- trl
|
all_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 6.6440677966101696,
|
3 |
-
"eval_loss": 2.
|
4 |
-
"eval_runtime": 16.
|
5 |
-
"eval_samples_per_second": 43.
|
6 |
-
"eval_steps_per_second": 5.
|
7 |
"total_flos": 5.749859310737818e+16,
|
8 |
"train_loss": 0.9609878695740992,
|
9 |
"train_runtime": 1272.9991,
|
|
|
1 |
{
|
2 |
"epoch": 6.6440677966101696,
|
3 |
+
"eval_loss": 2.677806854248047,
|
4 |
+
"eval_runtime": 16.1742,
|
5 |
+
"eval_samples_per_second": 43.774,
|
6 |
+
"eval_steps_per_second": 5.503,
|
7 |
"total_flos": 5.749859310737818e+16,
|
8 |
"train_loss": 0.9609878695740992,
|
9 |
"train_runtime": 1272.9991,
|
eval_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 6.6440677966101696,
|
3 |
-
"eval_loss": 2.
|
4 |
-
"eval_runtime": 16.
|
5 |
-
"eval_samples_per_second": 43.
|
6 |
-
"eval_steps_per_second": 5.
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 6.6440677966101696,
|
3 |
+
"eval_loss": 2.677806854248047,
|
4 |
+
"eval_runtime": 16.1742,
|
5 |
+
"eval_samples_per_second": 43.774,
|
6 |
+
"eval_steps_per_second": 5.503
|
7 |
}
|
trainer_state.json
CHANGED
@@ -175,6 +175,14 @@
|
|
175 |
"eval_samples_per_second": 43.753,
|
176 |
"eval_steps_per_second": 5.5,
|
177 |
"step": 98
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
178 |
}
|
179 |
],
|
180 |
"logging_steps": 10,
|
|
|
175 |
"eval_samples_per_second": 43.753,
|
176 |
"eval_steps_per_second": 5.5,
|
177 |
"step": 98
|
178 |
+
},
|
179 |
+
{
|
180 |
+
"epoch": 6.6440677966101696,
|
181 |
+
"eval_loss": 2.681103229522705,
|
182 |
+
"eval_runtime": 16.2756,
|
183 |
+
"eval_samples_per_second": 43.501,
|
184 |
+
"eval_steps_per_second": 5.468,
|
185 |
+
"step": 98
|
186 |
}
|
187 |
],
|
188 |
"logging_steps": 10,
|