nirmalendu01 committed on
Commit
b4f7098
1 Parent(s): 7f0a914

Training in progress, step 123

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db7512a5199c05ba44c1f08aec2662a08a8570c7c2b3550c640e7d2a845d6d6b
3
  size 4965805240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8004df829581f071a7fceb9f36552238d9722cec93c0e4572c68d1095e7a2f64
3
  size 4965805240
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a4f7a31c8ef4f890d96fde4b21c20a37840bf1c5a51e113e8f3d2bd756029bd
3
  size 1459729952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3216a8cdc37ff72b8815dd35bee33b18b4a5645f15fb989c6f18796812ab1fda
3
  size 1459729952
sft_sentimentbackdoors_sft_Llama-3.2-3B_experiment_3.3.txt CHANGED
@@ -317,3 +317,11 @@ Deleted local checkpoint-117.
317
  {'loss': 0.9633, 'grad_norm': 0.953125, 'learning_rate': 7.018020889533348e-06, 'epoch': 1.9}
318
  {'eval_loss': 0.9540155529975891, 'eval_runtime': 115.9483, 'eval_samples_per_second': 13.886, 'eval_steps_per_second': 1.742, 'epoch': 1.9}
319
  {'loss': 0.9944, 'grad_norm': 0.8984375, 'learning_rate': 6.837923331031761e-06, 'epoch': 1.92}
 
 
 
 
 
 
 
 
 
317
  {'loss': 0.9633, 'grad_norm': 0.953125, 'learning_rate': 7.018020889533348e-06, 'epoch': 1.9}
318
  {'eval_loss': 0.9540155529975891, 'eval_runtime': 115.9483, 'eval_samples_per_second': 13.886, 'eval_steps_per_second': 1.742, 'epoch': 1.9}
319
  {'loss': 0.9944, 'grad_norm': 0.8984375, 'learning_rate': 6.837923331031761e-06, 'epoch': 1.92}
320
+ {'eval_loss': 0.9536876082420349, 'eval_runtime': 116.1982, 'eval_samples_per_second': 13.856, 'eval_steps_per_second': 1.738, 'epoch': 1.92}
321
+ Pushed checkpoint-120 to Hugging Face Hub.
322
+ Deleted local checkpoint-120.
323
+ {'loss': 0.8953, 'grad_norm': 0.94921875, 'learning_rate': 6.6589582850261025e-06, 'epoch': 1.94}
324
+ {'eval_loss': 0.953357458114624, 'eval_runtime': 115.8383, 'eval_samples_per_second': 13.899, 'eval_steps_per_second': 1.744, 'epoch': 1.94}
325
+ {'loss': 0.898, 'grad_norm': 0.9375, 'learning_rate': 6.48118984868167e-06, 'epoch': 1.95}
326
+ {'eval_loss': 0.9531052708625793, 'eval_runtime': 116.237, 'eval_samples_per_second': 13.851, 'eval_steps_per_second': 1.738, 'epoch': 1.95}
327
+ {'loss': 0.9456, 'grad_norm': 0.89453125, 'learning_rate': 6.304681690592431e-06, 'epoch': 1.97}