Silemo commited on
Commit
10a137a
1 Parent(s): 164f825

Training in progress, step 2400, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce5374a700f6cb8856fec0d069890cb1c699a8142cbab7571daa3287a2b3058b
3
  size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:427ae072cbc49ae148942a74b9f051c838d316269f69b8f3611c391c8a391f3c
3
  size 966995080
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10dcd11e2cb1895f7c3e1c68032ca79221ba9837804ddc4c0ad628db4cb3bbbb
3
  size 1925064044
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08fe004ed695904662ce35ea3ec86602835c8a8f59b8179ec9a51565518cb6bf
3
  size 1925064044
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9f1fe924fb046e82f32a9e9633992150d028a3f688d46144a5a5c7f5cbc6bad
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff499e04130faa18bab8a5b949aa9f38474523cf8282520e9cbda71727ce4299
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6c2e8507c15e11b5d34f126b0dbb02f39afdf32066bd4c386593945bed215e3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b19556c05ce15c76b44c442588d62a6615081b49579cf8217e66cc8d1a38558
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 70.1955074875208,
3
  "best_model_checkpoint": "./whisper-it/checkpoint-300",
4
- "epoch": 4.00763358778626,
5
  "eval_steps": 100,
6
- "global_step": 2100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -700,6 +700,105 @@
700
  "eval_steps_per_second": 0.111,
701
  "eval_wer": 134.65058236272878,
702
  "step": 2100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
703
  }
704
  ],
705
  "logging_steps": 25,
@@ -707,7 +806,7 @@
707
  "num_input_tokens_seen": 0,
708
  "num_train_epochs": 8,
709
  "save_steps": 100,
710
- "total_flos": 1.938485851029504e+19,
711
  "trial_name": null,
712
  "trial_params": null
713
  }
 
1
  {
2
  "best_metric": 70.1955074875208,
3
  "best_model_checkpoint": "./whisper-it/checkpoint-300",
4
+ "epoch": 4.580152671755725,
5
  "eval_steps": 100,
6
+ "global_step": 2400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
700
  "eval_steps_per_second": 0.111,
701
  "eval_wer": 134.65058236272878,
702
  "step": 2100
703
+ },
704
+ {
705
+ "epoch": 4.06,
706
+ "learning_rate": 5.374285714285715e-06,
707
+ "loss": 0.018,
708
+ "step": 2125
709
+ },
710
+ {
711
+ "epoch": 4.1,
712
+ "learning_rate": 5.3028571428571425e-06,
713
+ "loss": 0.0165,
714
+ "step": 2150
715
+ },
716
+ {
717
+ "epoch": 4.15,
718
+ "learning_rate": 5.2314285714285716e-06,
719
+ "loss": 0.0157,
720
+ "step": 2175
721
+ },
722
+ {
723
+ "epoch": 4.2,
724
+ "learning_rate": 5.1600000000000006e-06,
725
+ "loss": 0.0173,
726
+ "step": 2200
727
+ },
728
+ {
729
+ "epoch": 4.2,
730
+ "eval_loss": 0.4140649735927582,
731
+ "eval_runtime": 1834.1524,
732
+ "eval_samples_per_second": 0.818,
733
+ "eval_steps_per_second": 0.102,
734
+ "eval_wer": 189.33721575152524,
735
+ "step": 2200
736
+ },
737
+ {
738
+ "epoch": 4.25,
739
+ "learning_rate": 5.08857142857143e-06,
740
+ "loss": 0.0157,
741
+ "step": 2225
742
+ },
743
+ {
744
+ "epoch": 4.29,
745
+ "learning_rate": 5.017142857142857e-06,
746
+ "loss": 0.015,
747
+ "step": 2250
748
+ },
749
+ {
750
+ "epoch": 4.34,
751
+ "learning_rate": 4.945714285714286e-06,
752
+ "loss": 0.0146,
753
+ "step": 2275
754
+ },
755
+ {
756
+ "epoch": 4.39,
757
+ "learning_rate": 4.874285714285715e-06,
758
+ "loss": 0.0174,
759
+ "step": 2300
760
+ },
761
+ {
762
+ "epoch": 4.39,
763
+ "eval_loss": 0.41064801812171936,
764
+ "eval_runtime": 1771.4749,
765
+ "eval_samples_per_second": 0.847,
766
+ "eval_steps_per_second": 0.106,
767
+ "eval_wer": 175.0207986688852,
768
+ "step": 2300
769
+ },
770
+ {
771
+ "epoch": 4.44,
772
+ "learning_rate": 4.802857142857143e-06,
773
+ "loss": 0.0164,
774
+ "step": 2325
775
+ },
776
+ {
777
+ "epoch": 4.48,
778
+ "learning_rate": 4.731428571428572e-06,
779
+ "loss": 0.0156,
780
+ "step": 2350
781
+ },
782
+ {
783
+ "epoch": 4.53,
784
+ "learning_rate": 4.66e-06,
785
+ "loss": 0.0145,
786
+ "step": 2375
787
+ },
788
+ {
789
+ "epoch": 4.58,
790
+ "learning_rate": 4.588571428571429e-06,
791
+ "loss": 0.0165,
792
+ "step": 2400
793
+ },
794
+ {
795
+ "epoch": 4.58,
796
+ "eval_loss": 0.4204367697238922,
797
+ "eval_runtime": 1768.9183,
798
+ "eval_samples_per_second": 0.848,
799
+ "eval_steps_per_second": 0.106,
800
+ "eval_wer": 179.64503605102607,
801
+ "step": 2400
802
  }
803
  ],
804
  "logging_steps": 25,
 
806
  "num_input_tokens_seen": 0,
807
  "num_train_epochs": 8,
808
  "save_steps": 100,
809
+ "total_flos": 2.215527835336704e+19,
810
  "trial_name": null,
811
  "trial_params": null
812
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77aa736647908221a6b18a6489ddd200e9a64629e700dfb2729d6eac836a4004
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec4f3c4eccd10d40b1e2a9f33f5736b02d4539dda80932770d03eaca234d4288
3
  size 4856