PEFT
Safetensors
llama
alignment-handbook
trl
sft
Generated from Trainer
nthakur's picture
End of training
b11aa57 verified
raw
history blame contribute delete
421 Bytes
{
"epoch": 0.999896960329727,
"eval_loss": 0.25926071405410767,
"eval_runtime": 2934.4316,
"eval_samples": 8000,
"eval_samples_per_second": 2.726,
"eval_steps_per_second": 0.341,
"total_flos": 2.4144679757152256e+16,
"train_loss": 0.3040192322367887,
"train_runtime": 137718.1009,
"train_samples": 77636,
"train_samples_per_second": 0.564,
"train_steps_per_second": 0.035
}