marcelovidigal committed on
Commit
6efadbc
1 Parent(s): cf5d08f

Training in progress, epoch 21

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dde74ab64751bd948f2089f033ab9ed4ec866afaeb97f83f3ec4d2380b5f58c2
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4918ded49d06748fc4d0bf1acebc7cef25f445e331b893d8d5d2ce1bdd74a026
3
  size 267832560
wandb/debug-internal.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240924_172630-x9iddikd/files/output.log CHANGED
@@ -55,3 +55,4 @@ You should probably TRAIN this model on a down-stream task to be able to use it
55
  {'eval_loss': 0.5907241106033325, 'eval_accuracy': 0.901, 'eval_runtime': 37.9133, 'eval_samples_per_second': 26.376, 'eval_steps_per_second': 0.844, 'epoch': 18.0}
56
  {'eval_loss': 0.517770528793335, 'eval_accuracy': 0.917, 'eval_runtime': 37.8369, 'eval_samples_per_second': 26.429, 'eval_steps_per_second': 0.846, 'epoch': 19.0}
57
  {'loss': 0.0187, 'grad_norm': 0.01947682909667492, 'learning_rate': 6e-06, 'epoch': 20.0}
 
 
55
  {'eval_loss': 0.5907241106033325, 'eval_accuracy': 0.901, 'eval_runtime': 37.9133, 'eval_samples_per_second': 26.376, 'eval_steps_per_second': 0.844, 'epoch': 18.0}
56
  {'eval_loss': 0.517770528793335, 'eval_accuracy': 0.917, 'eval_runtime': 37.8369, 'eval_samples_per_second': 26.429, 'eval_steps_per_second': 0.846, 'epoch': 19.0}
57
  {'loss': 0.0187, 'grad_norm': 0.01947682909667492, 'learning_rate': 6e-06, 'epoch': 20.0}
58
+ {'eval_loss': 0.5195603966712952, 'eval_accuracy': 0.92, 'eval_runtime': 37.9909, 'eval_samples_per_second': 26.322, 'eval_steps_per_second': 0.842, 'epoch': 20.0}
wandb/run-20240924_172630-x9iddikd/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"eval/loss": 0.5195603966712952, "eval/accuracy": 0.92, "eval/runtime": 37.9909, "eval/samples_per_second": 26.322, "eval/steps_per_second": 0.842, "train/epoch": 20.0, "train/global_step": 2500, "_timestamp": 1727254719.74196, "_runtime": 45128.869050979614, "_step": 32, "train/loss": 0.0187, "train/grad_norm": 0.01947682909667492, "train/learning_rate": 6e-06, "train_runtime": 8026.8642, "train_samples_per_second": 2.492, "train_steps_per_second": 0.156, "total_flos": 2396475988298112.0, "train_loss": 0.11480112991333008}
 
1
+ {"eval/loss": 0.8739770650863647, "eval/accuracy": 0.617, "eval/runtime": 213.6265, "eval/samples_per_second": 4.681, "eval/steps_per_second": 0.15, "train/epoch": 21.0, "train/global_step": 2625, "_timestamp": 1727257219.806164, "_runtime": 47628.9332549572, "_step": 33, "train/loss": 0.0187, "train/grad_norm": 0.01947682909667492, "train/learning_rate": 6e-06, "train_runtime": 8026.8642, "train_samples_per_second": 2.492, "train_steps_per_second": 0.156, "total_flos": 2396475988298112.0, "train_loss": 0.11480112991333008}
wandb/run-20240924_172630-x9iddikd/logs/debug-internal.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240924_172630-x9iddikd/run-x9iddikd.wandb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:928144a1be5757f0385988ce82942ee4f2429f7e6752e9071b3b840cf07d41a9
3
- size 1237111
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45a4a0fdb974a3d95ac5ad151db2bb81cdb2ef134a497304617a4fd2f1cbd9f
3
+ size 1306435