andrei-teodor committed on
Commit
1bc6f0b
·
verified ·
1 Parent(s): cb29732

Brain MRI 🧠 fine tune - 5 more epochs.

Browse files
README.md CHANGED
@@ -3,6 +3,7 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224
5
  tags:
 
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
@@ -16,10 +17,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # vit-base-brain-mri
18
 
19
- This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.6249
22
- - Accuracy: 0.7770
23
 
24
  ## Model description
25
 
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224
5
  tags:
6
+ - image-classification
7
  - generated_from_trainer
8
  metrics:
9
  - accuracy
 
17
 
18
  # vit-base-brain-mri
19
 
20
+ This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the BrainMRI dataset.
21
  It achieves the following results on the evaluation set:
22
+ - Loss: 1.1441
23
+ - Accuracy: 0.5457
24
 
25
  ## Model description
26
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.5304568527918782,
4
- "eval_loss": 1.1719971895217896,
5
- "eval_runtime": 7.6226,
6
- "eval_samples_per_second": 51.688,
7
- "eval_steps_per_second": 6.559,
8
- "total_flos": 8.896239873264845e+17,
9
- "train_loss": 0.0,
10
- "train_runtime": 0.201,
11
- "train_samples_per_second": 57114.909,
12
- "train_steps_per_second": 1791.06
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.5456852791878173,
4
+ "eval_loss": 1.1441423892974854,
5
+ "eval_runtime": 3.3533,
6
+ "eval_samples_per_second": 117.494,
7
+ "eval_steps_per_second": 14.91,
8
+ "total_flos": 1.779247974652969e+18,
9
+ "train_loss": 0.3026825189590454,
10
+ "train_runtime": 130.7944,
11
+ "train_samples_per_second": 175.543,
12
+ "train_steps_per_second": 5.505
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.5304568527918782,
4
- "eval_loss": 1.1719971895217896,
5
- "eval_runtime": 7.6226,
6
- "eval_samples_per_second": 51.688,
7
- "eval_steps_per_second": 6.559
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.5456852791878173,
4
+ "eval_loss": 1.1441423892974854,
5
+ "eval_runtime": 3.3533,
6
+ "eval_samples_per_second": 117.494,
7
+ "eval_steps_per_second": 14.91
8
  }
runs/Aug25_15-08-58_DESKTOP-4SGMSGR/events.out.tfevents.1724587887.DESKTOP-4SGMSGR.35484.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4595eed64c344239b3d3c66fab8db26b02ca685a6cc37e2e543104046d2e4c74
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "total_flos": 8.896239873264845e+17,
4
- "train_loss": 0.0,
5
- "train_runtime": 0.201,
6
- "train_samples_per_second": 57114.909,
7
- "train_steps_per_second": 1791.06
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 1.779247974652969e+18,
4
+ "train_loss": 0.3026825189590454,
5
+ "train_runtime": 130.7944,
6
+ "train_samples_per_second": 175.543,
7
+ "train_steps_per_second": 5.505
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.7015281915664673,
3
- "best_model_checkpoint": "./vit-base-brain-mri\\checkpoint-360",
4
- "epoch": 5.0,
5
  "eval_steps": 500,
6
- "global_step": 360,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -75,19 +75,92 @@
75
  "step": 360
76
  },
77
  {
78
- "epoch": 5.0,
79
- "step": 360,
80
- "total_flos": 8.896239873264845e+17,
81
- "train_loss": 0.0,
82
- "train_runtime": 0.201,
83
- "train_samples_per_second": 57114.909,
84
- "train_steps_per_second": 1791.06
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85
  }
86
  ],
87
  "logging_steps": 100,
88
- "max_steps": 360,
89
  "num_input_tokens_seen": 0,
90
- "num_train_epochs": 5,
91
  "save_steps": 500,
92
  "stateful_callbacks": {
93
  "TrainerControl": {
@@ -101,7 +174,7 @@
101
  "attributes": {}
102
  }
103
  },
104
- "total_flos": 8.896239873264845e+17,
105
  "train_batch_size": 32,
106
  "trial_name": null,
107
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6089015603065491,
3
+ "best_model_checkpoint": "./vit-base-brain-mri\\checkpoint-648",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 720,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
75
  "step": 360
76
  },
77
  {
78
+ "epoch": 5.555555555555555,
79
+ "grad_norm": 1.9345481395721436,
80
+ "learning_rate": 0.0001333333333333333,
81
+ "loss": 0.6651,
82
+ "step": 400
83
+ },
84
+ {
85
+ "epoch": 6.0,
86
+ "eval_accuracy": 0.7630662020905923,
87
+ "eval_loss": 0.68391352891922,
88
+ "eval_runtime": 4.8866,
89
+ "eval_samples_per_second": 117.465,
90
+ "eval_steps_per_second": 14.734,
91
+ "step": 432
92
+ },
93
+ {
94
+ "epoch": 6.944444444444445,
95
+ "grad_norm": 2.201732635498047,
96
+ "learning_rate": 9.166666666666667e-05,
97
+ "loss": 0.6307,
98
+ "step": 500
99
+ },
100
+ {
101
+ "epoch": 7.0,
102
+ "eval_accuracy": 0.7700348432055749,
103
+ "eval_loss": 0.6623685359954834,
104
+ "eval_runtime": 4.9432,
105
+ "eval_samples_per_second": 116.118,
106
+ "eval_steps_per_second": 14.565,
107
+ "step": 504
108
+ },
109
+ {
110
+ "epoch": 8.0,
111
+ "eval_accuracy": 0.7822299651567944,
112
+ "eval_loss": 0.6363218426704407,
113
+ "eval_runtime": 4.9241,
114
+ "eval_samples_per_second": 116.57,
115
+ "eval_steps_per_second": 14.622,
116
+ "step": 576
117
+ },
118
+ {
119
+ "epoch": 8.333333333333334,
120
+ "grad_norm": 1.8554637432098389,
121
+ "learning_rate": 4.9999999999999996e-05,
122
+ "loss": 0.5857,
123
+ "step": 600
124
+ },
125
+ {
126
+ "epoch": 9.0,
127
+ "eval_accuracy": 0.7822299651567944,
128
+ "eval_loss": 0.6089015603065491,
129
+ "eval_runtime": 4.9259,
130
+ "eval_samples_per_second": 116.527,
131
+ "eval_steps_per_second": 14.617,
132
+ "step": 648
133
+ },
134
+ {
135
+ "epoch": 9.722222222222221,
136
+ "grad_norm": 3.4061734676361084,
137
+ "learning_rate": 8.333333333333332e-06,
138
+ "loss": 0.576,
139
+ "step": 700
140
+ },
141
+ {
142
+ "epoch": 10.0,
143
+ "eval_accuracy": 0.7770034843205574,
144
+ "eval_loss": 0.6249111294746399,
145
+ "eval_runtime": 5.1184,
146
+ "eval_samples_per_second": 112.144,
147
+ "eval_steps_per_second": 14.067,
148
+ "step": 720
149
+ },
150
+ {
151
+ "epoch": 10.0,
152
+ "step": 720,
153
+ "total_flos": 1.779247974652969e+18,
154
+ "train_loss": 0.3026825189590454,
155
+ "train_runtime": 130.7944,
156
+ "train_samples_per_second": 175.543,
157
+ "train_steps_per_second": 5.505
158
  }
159
  ],
160
  "logging_steps": 100,
161
+ "max_steps": 720,
162
  "num_input_tokens_seen": 0,
163
+ "num_train_epochs": 10,
164
  "save_steps": 500,
165
  "stateful_callbacks": {
166
  "TrainerControl": {
 
174
  "attributes": {}
175
  }
176
  },
177
+ "total_flos": 1.779247974652969e+18,
178
  "train_batch_size": 32,
179
  "trial_name": null,
180
  "trial_params": null