TheBug95 committed on
Commit
91f1f91
1 Parent(s): 5fa0619

Model save

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +4 -4
  3. eval_results.json +4 -4
  4. trainer_state.json +8 -0
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  base_model: meta-llama/Llama-3.2-1B
3
  library_name: transformers
4
- model_name: Llama-3.2-1B-MS-MARCO-Qlora
5
  tags:
6
  - generated_from_trainer
7
  - trl
 
1
  ---
2
  base_model: meta-llama/Llama-3.2-1B
3
  library_name: transformers
4
+ model_name: results
5
  tags:
6
  - generated_from_trainer
7
  - trl
all_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 6.6440677966101696,
3
- "eval_loss": 2.681103229522705,
4
- "eval_runtime": 16.2756,
5
- "eval_samples_per_second": 43.501,
6
- "eval_steps_per_second": 5.468,
7
  "total_flos": 5.749859310737818e+16,
8
  "train_loss": 0.9609878695740992,
9
  "train_runtime": 1272.9991,
 
1
  {
2
  "epoch": 6.6440677966101696,
3
+ "eval_loss": 2.677806854248047,
4
+ "eval_runtime": 16.1742,
5
+ "eval_samples_per_second": 43.774,
6
+ "eval_steps_per_second": 5.503,
7
  "total_flos": 5.749859310737818e+16,
8
  "train_loss": 0.9609878695740992,
9
  "train_runtime": 1272.9991,
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 6.6440677966101696,
3
- "eval_loss": 2.681103229522705,
4
- "eval_runtime": 16.2756,
5
- "eval_samples_per_second": 43.501,
6
- "eval_steps_per_second": 5.468
7
  }
 
1
  {
2
  "epoch": 6.6440677966101696,
3
+ "eval_loss": 2.677806854248047,
4
+ "eval_runtime": 16.1742,
5
+ "eval_samples_per_second": 43.774,
6
+ "eval_steps_per_second": 5.503
7
  }
trainer_state.json CHANGED
@@ -175,6 +175,14 @@
175
  "eval_samples_per_second": 43.753,
176
  "eval_steps_per_second": 5.5,
177
  "step": 98
 
 
 
 
 
 
 
 
178
  }
179
  ],
180
  "logging_steps": 10,
 
175
  "eval_samples_per_second": 43.753,
176
  "eval_steps_per_second": 5.5,
177
  "step": 98
178
+ },
179
+ {
180
+ "epoch": 6.6440677966101696,
181
+ "eval_loss": 2.681103229522705,
182
+ "eval_runtime": 16.2756,
183
+ "eval_samples_per_second": 43.501,
184
+ "eval_steps_per_second": 5.468,
185
+ "step": 98
186
  }
187
  ],
188
  "logging_steps": 10,