Training in progress, epoch 70, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa812769d7086f7d6e19077f55b8e92cd7d402c7253b4b8e5b162c1020e22881
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:650ddd0fde638547cf9b2a00a224f109876334850aa5fcdf74e8cbf8ca681f89
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:685346e99c461788ef127f10b4458c9a0913ccd9cd3182686a88d0c9875a0b90
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dd2e1f761a5703283541aef2eeade4dd37cc067c721190ff4ee0690c491491b
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.3433947265148163,
|
3 |
"best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-33000",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -9851,6 +9851,144 @@
|
|
9851 |
"eval_samples_per_second": 7.579,
|
9852 |
"eval_steps_per_second": 0.985,
|
9853 |
"step": 34500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9854 |
}
|
9855 |
],
|
9856 |
"logging_steps": 30,
|
@@ -9870,7 +10008,7 @@
|
|
9870 |
"attributes": {}
|
9871 |
}
|
9872 |
},
|
9873 |
-
"total_flos": 1.
|
9874 |
"train_batch_size": 2,
|
9875 |
"trial_name": null,
|
9876 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.3433947265148163,
|
3 |
"best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-33000",
|
4 |
+
"epoch": 70.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 35000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
9851 |
"eval_samples_per_second": 7.579,
|
9852 |
"eval_steps_per_second": 0.985,
|
9853 |
"step": 34500
|
9854 |
+
},
|
9855 |
+
{
|
9856 |
+
"epoch": 69.06,
|
9857 |
+
"grad_norm": 5.733088619308546e-05,
|
9858 |
+
"learning_rate": 5.620432034152107e-06,
|
9859 |
+
"loss": 0.4275,
|
9860 |
+
"step": 34530
|
9861 |
+
},
|
9862 |
+
{
|
9863 |
+
"epoch": 69.12,
|
9864 |
+
"grad_norm": 51.50437927246094,
|
9865 |
+
"learning_rate": 5.614196920735822e-06,
|
9866 |
+
"loss": 0.4622,
|
9867 |
+
"step": 34560
|
9868 |
+
},
|
9869 |
+
{
|
9870 |
+
"epoch": 69.18,
|
9871 |
+
"grad_norm": 38.773948669433594,
|
9872 |
+
"learning_rate": 5.607960837418763e-06,
|
9873 |
+
"loss": 0.4583,
|
9874 |
+
"step": 34590
|
9875 |
+
},
|
9876 |
+
{
|
9877 |
+
"epoch": 69.24,
|
9878 |
+
"grad_norm": 43.785675048828125,
|
9879 |
+
"learning_rate": 5.601723794048558e-06,
|
9880 |
+
"loss": 0.4097,
|
9881 |
+
"step": 34620
|
9882 |
+
},
|
9883 |
+
{
|
9884 |
+
"epoch": 69.3,
|
9885 |
+
"grad_norm": 45.26587677001953,
|
9886 |
+
"learning_rate": 5.59548580047435e-06,
|
9887 |
+
"loss": 0.4097,
|
9888 |
+
"step": 34650
|
9889 |
+
},
|
9890 |
+
{
|
9891 |
+
"epoch": 69.36,
|
9892 |
+
"grad_norm": 28.66240882873535,
|
9893 |
+
"learning_rate": 5.58924686654678e-06,
|
9894 |
+
"loss": 0.4591,
|
9895 |
+
"step": 34680
|
9896 |
+
},
|
9897 |
+
{
|
9898 |
+
"epoch": 69.42,
|
9899 |
+
"grad_norm": 43.78499984741211,
|
9900 |
+
"learning_rate": 5.5830070021179785e-06,
|
9901 |
+
"loss": 0.4095,
|
9902 |
+
"step": 34710
|
9903 |
+
},
|
9904 |
+
{
|
9905 |
+
"epoch": 69.48,
|
9906 |
+
"grad_norm": 32.92940139770508,
|
9907 |
+
"learning_rate": 5.576766217041541e-06,
|
9908 |
+
"loss": 0.4634,
|
9909 |
+
"step": 34740
|
9910 |
+
},
|
9911 |
+
{
|
9912 |
+
"epoch": 69.54,
|
9913 |
+
"grad_norm": 50.84819793701172,
|
9914 |
+
"learning_rate": 5.570524521172523e-06,
|
9915 |
+
"loss": 0.4746,
|
9916 |
+
"step": 34770
|
9917 |
+
},
|
9918 |
+
{
|
9919 |
+
"epoch": 69.6,
|
9920 |
+
"grad_norm": 38.97684097290039,
|
9921 |
+
"learning_rate": 5.5642819243674085e-06,
|
9922 |
+
"loss": 0.3952,
|
9923 |
+
"step": 34800
|
9924 |
+
},
|
9925 |
+
{
|
9926 |
+
"epoch": 69.66,
|
9927 |
+
"grad_norm": 100.71194458007812,
|
9928 |
+
"learning_rate": 5.558038436484116e-06,
|
9929 |
+
"loss": 0.4176,
|
9930 |
+
"step": 34830
|
9931 |
+
},
|
9932 |
+
{
|
9933 |
+
"epoch": 69.72,
|
9934 |
+
"grad_norm": 33.512420654296875,
|
9935 |
+
"learning_rate": 5.551794067381959e-06,
|
9936 |
+
"loss": 0.4269,
|
9937 |
+
"step": 34860
|
9938 |
+
},
|
9939 |
+
{
|
9940 |
+
"epoch": 69.78,
|
9941 |
+
"grad_norm": 54.8726692199707,
|
9942 |
+
"learning_rate": 5.545548826921653e-06,
|
9943 |
+
"loss": 0.3438,
|
9944 |
+
"step": 34890
|
9945 |
+
},
|
9946 |
+
{
|
9947 |
+
"epoch": 69.84,
|
9948 |
+
"grad_norm": 0.00013334951654542238,
|
9949 |
+
"learning_rate": 5.5393027249652844e-06,
|
9950 |
+
"loss": 0.4642,
|
9951 |
+
"step": 34920
|
9952 |
+
},
|
9953 |
+
{
|
9954 |
+
"epoch": 69.9,
|
9955 |
+
"grad_norm": 9.714184125186875e-05,
|
9956 |
+
"learning_rate": 5.5330557713763e-06,
|
9957 |
+
"loss": 0.3817,
|
9958 |
+
"step": 34950
|
9959 |
+
},
|
9960 |
+
{
|
9961 |
+
"epoch": 69.96,
|
9962 |
+
"grad_norm": 55.636146545410156,
|
9963 |
+
"learning_rate": 5.526807976019492e-06,
|
9964 |
+
"loss": 0.4091,
|
9965 |
+
"step": 34980
|
9966 |
+
},
|
9967 |
+
{
|
9968 |
+
"epoch": 70.0,
|
9969 |
+
"eval_loss": 0.3745727241039276,
|
9970 |
+
"eval_map": 0.7332,
|
9971 |
+
"eval_map_50": 0.9476,
|
9972 |
+
"eval_map_75": 0.8716,
|
9973 |
+
"eval_map_chicken": 0.7196,
|
9974 |
+
"eval_map_duck": 0.6808,
|
9975 |
+
"eval_map_large": 0.7409,
|
9976 |
+
"eval_map_medium": 0.728,
|
9977 |
+
"eval_map_plant": 0.7992,
|
9978 |
+
"eval_map_small": 0.1368,
|
9979 |
+
"eval_mar_1": 0.3026,
|
9980 |
+
"eval_mar_10": 0.7781,
|
9981 |
+
"eval_mar_100": 0.7825,
|
9982 |
+
"eval_mar_100_chicken": 0.7726,
|
9983 |
+
"eval_mar_100_duck": 0.7351,
|
9984 |
+
"eval_mar_100_plant": 0.8397,
|
9985 |
+
"eval_mar_large": 0.7993,
|
9986 |
+
"eval_mar_medium": 0.7767,
|
9987 |
+
"eval_mar_small": 0.2071,
|
9988 |
+
"eval_runtime": 14.4354,
|
9989 |
+
"eval_samples_per_second": 6.927,
|
9990 |
+
"eval_steps_per_second": 0.901,
|
9991 |
+
"step": 35000
|
9992 |
}
|
9993 |
],
|
9994 |
"logging_steps": 30,
|
|
|
10008 |
"attributes": {}
|
10009 |
}
|
10010 |
},
|
10011 |
+
"total_flos": 1.2040808951808e+19,
|
10012 |
"train_batch_size": 2,
|
10013 |
"trial_name": null,
|
10014 |
"trial_params": null
|