End of training
Browse files
- README.md +24 -5
- all_results.json +6 -6
- config.json +1 -0
- eval_results.json +3 -3
- runs/Mar02_14-41-50_04f752329dca/events.out.tfevents.1709390811.04f752329dca.283.1 +3 -0
- train_results.json +3 -3
- trainer_state.json +3 -3
README.md
CHANGED
@@ -2,23 +2,42 @@
|
|
2 |
license: apache-2.0
|
3 |
base_model: facebook/deit-base-distilled-patch16-224
|
4 |
tags:
|
|
|
|
|
5 |
- generated_from_trainer
|
6 |
metrics:
|
7 |
- accuracy
|
8 |
model-index:
|
9 |
-
- name: base
|
|
|
|
|
|
|
|
|
10 |
results: []
|
11 |
---
|
12 |
|
13 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
14 |
should probably proofread and complete it, then remove this comment. -->
|
15 |
|
16 |
-
# base
|
17 |
-
|
18 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
It achieves the following results on the evaluation set:
|
20 |
-
- Accuracy: 0.906
|
21 |
- Loss: 0.3054
|
|
|
22 |
|
23 |
## Model description
|
24 |
|
|
|
2 |
license: apache-2.0
|
3 |
base_model: facebook/deit-base-distilled-patch16-224
|
4 |
tags:
|
5 |
+
- image-classification
|
6 |
+
- vision
|
7 |
- generated_from_trainer
|
8 |
metrics:
|
9 |
- accuracy
|
10 |
model-index:
|
11 |
+
- name: "DeiT-base-DatasetDict({\n train: Dataset({\n features: ['img',\
|
12 |
+
\ 'fine_label', 'coarse_label'],\n num_rows: 50000\n })\n test: Dataset({\n\
|
13 |
+
\ features: ['img', 'fine_label', 'coarse_label'],\n num_rows: 10000\n\
|
14 |
+
\ })\n validation: Dataset({\n features: ['img', 'fine_label', 'coarse_label'],\n\
|
15 |
+
\ num_rows: 10000\n })\n})"
|
16 |
results: []
|
17 |
---
|
18 |
|
19 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
20 |
should probably proofread and complete it, then remove this comment. -->
|
21 |
|
22 |
+
# DeiT-base-DatasetDict({
|
23 |
+
train: Dataset({
|
24 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
25 |
+
num_rows: 50000
|
26 |
+
})
|
27 |
+
test: Dataset({
|
28 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
29 |
+
num_rows: 10000
|
30 |
+
})
|
31 |
+
validation: Dataset({
|
32 |
+
features: ['img', 'fine_label', 'coarse_label'],
|
33 |
+
num_rows: 10000
|
34 |
+
})
|
35 |
+
})
|
36 |
+
|
37 |
+
This model is a fine-tuned version of [facebook/deit-base-distilled-patch16-224](https://huggingface.co/facebook/deit-base-distilled-patch16-224) on the cifar100 dataset.
|
38 |
It achieves the following results on the evaluation set:
|
|
|
39 |
- Loss: 0.3054
|
40 |
+
- Accuracy: 0.906
|
41 |
|
42 |
## Model description
|
43 |
|
all_results.json
CHANGED
@@ -2,12 +2,12 @@
|
|
2 |
"epoch": 10.0,
|
3 |
"eval_accuracy": 0.906,
|
4 |
"eval_loss": 0.3053509294986725,
|
5 |
-
"eval_runtime":
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
"total_flos": 3.8815447523328e+19,
|
9 |
"train_loss": 0.0,
|
10 |
-
"train_runtime":
|
11 |
-
"train_samples_per_second":
|
12 |
-
"train_steps_per_second":
|
13 |
}
|
|
|
2 |
"epoch": 10.0,
|
3 |
"eval_accuracy": 0.906,
|
4 |
"eval_loss": 0.3053509294986725,
|
5 |
+
"eval_runtime": 175.7662,
|
6 |
+
"eval_samples_per_second": 56.894,
|
7 |
+
"eval_steps_per_second": 56.894,
|
8 |
"total_flos": 3.8815447523328e+19,
|
9 |
"train_loss": 0.0,
|
10 |
+
"train_runtime": 36.1375,
|
11 |
+
"train_samples_per_second": 13836.038,
|
12 |
+
"train_steps_per_second": 216.396
|
13 |
}
|
config.json
CHANGED
@@ -222,6 +222,7 @@
|
|
222 |
"num_channels": 3,
|
223 |
"num_hidden_layers": 12,
|
224 |
"patch_size": 16,
|
|
|
225 |
"qkv_bias": true,
|
226 |
"torch_dtype": "float32",
|
227 |
"transformers_version": "4.38.1"
|
|
|
222 |
"num_channels": 3,
|
223 |
"num_hidden_layers": 12,
|
224 |
"patch_size": 16,
|
225 |
+
"problem_type": "single_label_classification",
|
226 |
"qkv_bias": true,
|
227 |
"torch_dtype": "float32",
|
228 |
"transformers_version": "4.38.1"
|
eval_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 10.0,
|
3 |
"eval_accuracy": 0.906,
|
4 |
"eval_loss": 0.3053509294986725,
|
5 |
-
"eval_runtime":
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second":
|
8 |
}
|
|
|
2 |
"epoch": 10.0,
|
3 |
"eval_accuracy": 0.906,
|
4 |
"eval_loss": 0.3053509294986725,
|
5 |
+
"eval_runtime": 175.7662,
|
6 |
+
"eval_samples_per_second": 56.894,
|
7 |
+
"eval_steps_per_second": 56.894
|
8 |
}
|
runs/Mar02_14-41-50_04f752329dca/events.out.tfevents.1709390811.04f752329dca.283.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:898c1208cdb37723a8396fc5cc641298180de02118c7a73d681bd6295c943afd
|
3 |
+
size 411
|
train_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 10.0,
|
3 |
"total_flos": 3.8815447523328e+19,
|
4 |
"train_loss": 0.0,
|
5 |
-
"train_runtime":
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
2 |
"epoch": 10.0,
|
3 |
"total_flos": 3.8815447523328e+19,
|
4 |
"train_loss": 0.0,
|
5 |
+
"train_runtime": 36.1375,
|
6 |
+
"train_samples_per_second": 13836.038,
|
7 |
+
"train_steps_per_second": 216.396
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1039,9 +1039,9 @@
|
|
1039 |
"step": 7820,
|
1040 |
"total_flos": 3.8815447523328e+19,
|
1041 |
"train_loss": 0.0,
|
1042 |
-
"train_runtime":
|
1043 |
-
"train_samples_per_second":
|
1044 |
-
"train_steps_per_second":
|
1045 |
}
|
1046 |
],
|
1047 |
"logging_steps": 50,
|
|
|
1039 |
"step": 7820,
|
1040 |
"total_flos": 3.8815447523328e+19,
|
1041 |
"train_loss": 0.0,
|
1042 |
+
"train_runtime": 36.1375,
|
1043 |
+
"train_samples_per_second": 13836.038,
|
1044 |
+
"train_steps_per_second": 216.396
|
1045 |
}
|
1046 |
],
|
1047 |
"logging_steps": 50,
|