joe611 commited on
Commit
2df5d08
1 Parent(s): d1a3cb9

Training in progress, epoch 70, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8afc1746185cec16643e581fb9ab5321c6d13ec4eecbac00df77e4a2ef3926cb
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa812769d7086f7d6e19077f55b8e92cd7d402c7253b4b8e5b162c1020e22881
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:475525798608d625979c7d71f2941abe896d06146dd33aea4d8d715b4e8faefd
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:650ddd0fde638547cf9b2a00a224f109876334850aa5fcdf74e8cbf8ca681f89
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11db7bd7e6b331ec7027c1f9a58bac7d1a561357af84f38d3e10be5a0609cf76
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:685346e99c461788ef127f10b4458c9a0913ccd9cd3182686a88d0c9875a0b90
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9598ad7b14a1bbfb3ebd21f90fe1eb55454683653bdb0336d16fa0ddbc0fd33b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dd2e1f761a5703283541aef2eeade4dd37cc067c721190ff4ee0690c491491b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.3433947265148163,
3
  "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-33000",
4
- "epoch": 69.0,
5
  "eval_steps": 500,
6
- "global_step": 34500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -9851,6 +9851,144 @@
9851
  "eval_samples_per_second": 7.579,
9852
  "eval_steps_per_second": 0.985,
9853
  "step": 34500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9854
  }
9855
  ],
9856
  "logging_steps": 30,
@@ -9870,7 +10008,7 @@
9870
  "attributes": {}
9871
  }
9872
  },
9873
- "total_flos": 1.18687973953536e+19,
9874
  "train_batch_size": 2,
9875
  "trial_name": null,
9876
  "trial_params": null
 
1
  {
2
  "best_metric": 0.3433947265148163,
3
  "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-33000",
4
+ "epoch": 70.0,
5
  "eval_steps": 500,
6
+ "global_step": 35000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
9851
  "eval_samples_per_second": 7.579,
9852
  "eval_steps_per_second": 0.985,
9853
  "step": 34500
9854
+ },
9855
+ {
9856
+ "epoch": 69.06,
9857
+ "grad_norm": 5.733088619308546e-05,
9858
+ "learning_rate": 5.620432034152107e-06,
9859
+ "loss": 0.4275,
9860
+ "step": 34530
9861
+ },
9862
+ {
9863
+ "epoch": 69.12,
9864
+ "grad_norm": 51.50437927246094,
9865
+ "learning_rate": 5.614196920735822e-06,
9866
+ "loss": 0.4622,
9867
+ "step": 34560
9868
+ },
9869
+ {
9870
+ "epoch": 69.18,
9871
+ "grad_norm": 38.773948669433594,
9872
+ "learning_rate": 5.607960837418763e-06,
9873
+ "loss": 0.4583,
9874
+ "step": 34590
9875
+ },
9876
+ {
9877
+ "epoch": 69.24,
9878
+ "grad_norm": 43.785675048828125,
9879
+ "learning_rate": 5.601723794048558e-06,
9880
+ "loss": 0.4097,
9881
+ "step": 34620
9882
+ },
9883
+ {
9884
+ "epoch": 69.3,
9885
+ "grad_norm": 45.26587677001953,
9886
+ "learning_rate": 5.59548580047435e-06,
9887
+ "loss": 0.4097,
9888
+ "step": 34650
9889
+ },
9890
+ {
9891
+ "epoch": 69.36,
9892
+ "grad_norm": 28.66240882873535,
9893
+ "learning_rate": 5.58924686654678e-06,
9894
+ "loss": 0.4591,
9895
+ "step": 34680
9896
+ },
9897
+ {
9898
+ "epoch": 69.42,
9899
+ "grad_norm": 43.78499984741211,
9900
+ "learning_rate": 5.5830070021179785e-06,
9901
+ "loss": 0.4095,
9902
+ "step": 34710
9903
+ },
9904
+ {
9905
+ "epoch": 69.48,
9906
+ "grad_norm": 32.92940139770508,
9907
+ "learning_rate": 5.576766217041541e-06,
9908
+ "loss": 0.4634,
9909
+ "step": 34740
9910
+ },
9911
+ {
9912
+ "epoch": 69.54,
9913
+ "grad_norm": 50.84819793701172,
9914
+ "learning_rate": 5.570524521172523e-06,
9915
+ "loss": 0.4746,
9916
+ "step": 34770
9917
+ },
9918
+ {
9919
+ "epoch": 69.6,
9920
+ "grad_norm": 38.97684097290039,
9921
+ "learning_rate": 5.5642819243674085e-06,
9922
+ "loss": 0.3952,
9923
+ "step": 34800
9924
+ },
9925
+ {
9926
+ "epoch": 69.66,
9927
+ "grad_norm": 100.71194458007812,
9928
+ "learning_rate": 5.558038436484116e-06,
9929
+ "loss": 0.4176,
9930
+ "step": 34830
9931
+ },
9932
+ {
9933
+ "epoch": 69.72,
9934
+ "grad_norm": 33.512420654296875,
9935
+ "learning_rate": 5.551794067381959e-06,
9936
+ "loss": 0.4269,
9937
+ "step": 34860
9938
+ },
9939
+ {
9940
+ "epoch": 69.78,
9941
+ "grad_norm": 54.8726692199707,
9942
+ "learning_rate": 5.545548826921653e-06,
9943
+ "loss": 0.3438,
9944
+ "step": 34890
9945
+ },
9946
+ {
9947
+ "epoch": 69.84,
9948
+ "grad_norm": 0.00013334951654542238,
9949
+ "learning_rate": 5.5393027249652844e-06,
9950
+ "loss": 0.4642,
9951
+ "step": 34920
9952
+ },
9953
+ {
9954
+ "epoch": 69.9,
9955
+ "grad_norm": 9.714184125186875e-05,
9956
+ "learning_rate": 5.5330557713763e-06,
9957
+ "loss": 0.3817,
9958
+ "step": 34950
9959
+ },
9960
+ {
9961
+ "epoch": 69.96,
9962
+ "grad_norm": 55.636146545410156,
9963
+ "learning_rate": 5.526807976019492e-06,
9964
+ "loss": 0.4091,
9965
+ "step": 34980
9966
+ },
9967
+ {
9968
+ "epoch": 70.0,
9969
+ "eval_loss": 0.3745727241039276,
9970
+ "eval_map": 0.7332,
9971
+ "eval_map_50": 0.9476,
9972
+ "eval_map_75": 0.8716,
9973
+ "eval_map_chicken": 0.7196,
9974
+ "eval_map_duck": 0.6808,
9975
+ "eval_map_large": 0.7409,
9976
+ "eval_map_medium": 0.728,
9977
+ "eval_map_plant": 0.7992,
9978
+ "eval_map_small": 0.1368,
9979
+ "eval_mar_1": 0.3026,
9980
+ "eval_mar_10": 0.7781,
9981
+ "eval_mar_100": 0.7825,
9982
+ "eval_mar_100_chicken": 0.7726,
9983
+ "eval_mar_100_duck": 0.7351,
9984
+ "eval_mar_100_plant": 0.8397,
9985
+ "eval_mar_large": 0.7993,
9986
+ "eval_mar_medium": 0.7767,
9987
+ "eval_mar_small": 0.2071,
9988
+ "eval_runtime": 14.4354,
9989
+ "eval_samples_per_second": 6.927,
9990
+ "eval_steps_per_second": 0.901,
9991
+ "step": 35000
9992
  }
9993
  ],
9994
  "logging_steps": 30,
 
10008
  "attributes": {}
10009
  }
10010
  },
10011
+ "total_flos": 1.2040808951808e+19,
10012
  "train_batch_size": 2,
10013
  "trial_name": null,
10014
  "trial_params": null