End of training
Browse files
- README.md +4 -2
- all_results.json +6 -6
- test_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +3 -3
- training_args.bin +1 -1
README.md
CHANGED
@@ -2,6 +2,8 @@
|
|
2 |
license: apache-2.0
|
3 |
base_model: SenseTime/deformable-detr
|
4 |
tags:
|
|
|
|
|
5 |
- generated_from_trainer
|
6 |
model-index:
|
7 |
- name: sensetime-deformable-detr-finetuned-10k-cppe5-manual-pad
|
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
14 |
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/qubvel-hf-co/transformers-detection-model-finetuning-cppe5/runs/zv86s9w6)
|
15 |
# sensetime-deformable-detr-finetuned-10k-cppe5-manual-pad
|
16 |
|
17 |
-
This model is a fine-tuned version of [SenseTime/deformable-detr](https://huggingface.co/SenseTime/deformable-detr) on
|
18 |
It achieves the following results on the evaluation set:
|
19 |
- Loss: 1.0442
|
20 |
- Map: 0.3514
|
@@ -59,7 +61,7 @@ More information needed
|
|
59 |
The following hyperparameters were used during training:
|
60 |
- learning_rate: 5e-05
|
61 |
- train_batch_size: 4
|
62 |
-
- eval_batch_size:
|
63 |
- seed: 1337
|
64 |
- gradient_accumulation_steps: 2
|
65 |
- total_train_batch_size: 8
|
|
|
2 |
license: apache-2.0
|
3 |
base_model: SenseTime/deformable-detr
|
4 |
tags:
|
5 |
+
- object-detection
|
6 |
+
- vision
|
7 |
- generated_from_trainer
|
8 |
model-index:
|
9 |
- name: sensetime-deformable-detr-finetuned-10k-cppe5-manual-pad
|
|
|
16 |
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/qubvel-hf-co/transformers-detection-model-finetuning-cppe5/runs/zv86s9w6)
|
17 |
# sensetime-deformable-detr-finetuned-10k-cppe5-manual-pad
|
18 |
|
19 |
+
This model is a fine-tuned version of [SenseTime/deformable-detr](https://huggingface.co/SenseTime/deformable-detr) on the cppe-5 dataset.
|
20 |
It achieves the following results on the evaluation set:
|
21 |
- Loss: 1.0442
|
22 |
- Map: 0.3514
|
|
|
61 |
The following hyperparameters were used during training:
|
62 |
- learning_rate: 5e-05
|
63 |
- train_batch_size: 4
|
64 |
+
- eval_batch_size: 1
|
65 |
- seed: 1337
|
66 |
- gradient_accumulation_steps: 2
|
67 |
- total_train_batch_size: 8
|
all_results.json
CHANGED
@@ -49,12 +49,12 @@
|
|
49 |
"test_mar_large": 0.8137,
|
50 |
"test_mar_medium": 0.5441,
|
51 |
"test_mar_small": 0.5739,
|
52 |
-
"test_runtime": 5.
|
53 |
-
"test_samples_per_second": 5.
|
54 |
-
"test_steps_per_second": 5.
|
55 |
"total_flos": 2.1870706694064443e+19,
|
56 |
"train_loss": 0.0,
|
57 |
-
"train_runtime": 3.
|
58 |
-
"train_samples_per_second":
|
59 |
-
"train_steps_per_second":
|
60 |
}
|
|
|
49 |
"test_mar_large": 0.8137,
|
50 |
"test_mar_medium": 0.5441,
|
51 |
"test_mar_small": 0.5739,
|
52 |
+
"test_runtime": 5.4531,
|
53 |
+
"test_samples_per_second": 5.318,
|
54 |
+
"test_steps_per_second": 5.318,
|
55 |
"total_flos": 2.1870706694064443e+19,
|
56 |
"train_loss": 0.0,
|
57 |
+
"train_runtime": 3.1369,
|
58 |
+
"train_samples_per_second": 27096.987,
|
59 |
+
"train_steps_per_second": 3379.154
|
60 |
}
|
test_results.json
CHANGED
@@ -23,7 +23,7 @@
|
|
23 |
"test_mar_large": 0.8137,
|
24 |
"test_mar_medium": 0.5441,
|
25 |
"test_mar_small": 0.5739,
|
26 |
-
"test_runtime": 5.
|
27 |
-
"test_samples_per_second": 5.
|
28 |
-
"test_steps_per_second": 5.
|
29 |
}
|
|
|
23 |
"test_mar_large": 0.8137,
|
24 |
"test_mar_medium": 0.5441,
|
25 |
"test_mar_small": 0.5739,
|
26 |
+
"test_runtime": 5.4531,
|
27 |
+
"test_samples_per_second": 5.318,
|
28 |
+
"test_steps_per_second": 5.318
|
29 |
}
|
train_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 99.53051643192488,
|
3 |
"total_flos": 2.1870706694064443e+19,
|
4 |
"train_loss": 0.0,
|
5 |
-
"train_runtime": 3.
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
2 |
"epoch": 99.53051643192488,
|
3 |
"total_flos": 2.1870706694064443e+19,
|
4 |
"train_loss": 0.0,
|
5 |
+
"train_runtime": 3.1369,
|
6 |
+
"train_samples_per_second": 27096.987,
|
7 |
+
"train_steps_per_second": 3379.154
|
8 |
}
|
trainer_state.json
CHANGED
@@ -3713,9 +3713,9 @@
|
|
3713 |
"step": 10600,
|
3714 |
"total_flos": 2.1870706694064443e+19,
|
3715 |
"train_loss": 0.0,
|
3716 |
-
"train_runtime": 3.
|
3717 |
-
"train_samples_per_second":
|
3718 |
-
"train_steps_per_second":
|
3719 |
}
|
3720 |
],
|
3721 |
"logging_steps": 500,
|
|
|
3713 |
"step": 10600,
|
3714 |
"total_flos": 2.1870706694064443e+19,
|
3715 |
"train_loss": 0.0,
|
3716 |
+
"train_runtime": 3.1369,
|
3717 |
+
"train_samples_per_second": 27096.987,
|
3718 |
+
"train_steps_per_second": 3379.154
|
3719 |
}
|
3720 |
],
|
3721 |
"logging_steps": 500,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4923
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3222ccdb193d177cc05f5ceafdc6676c18c37cf5c8df097f28bd95c9df0e91
|
3 |
size 4923
|