okhytrov committed on
Commit
6880ae2
·
verified ·
1 Parent(s): 3845698

End of training

Browse files
README.md CHANGED
@@ -2,23 +2,42 @@
2
  license: apache-2.0
3
  base_model: facebook/deit-base-distilled-patch16-224
4
  tags:
 
 
5
  - generated_from_trainer
6
  metrics:
7
  - accuracy
8
  model-index:
9
- - name: base
 
 
 
 
10
  results: []
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
  should probably proofread and complete it, then remove this comment. -->
15
 
16
- # base
17
-
18
- This model is a fine-tuned version of [facebook/deit-base-distilled-patch16-224](https://huggingface.co/facebook/deit-base-distilled-patch16-224) on an unknown dataset.
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  It achieves the following results on the evaluation set:
20
- - Accuracy: 0.906
21
  - Loss: 0.3054
 
22
 
23
  ## Model description
24
 
 
2
  license: apache-2.0
3
  base_model: facebook/deit-base-distilled-patch16-224
4
  tags:
5
+ - image-classification
6
+ - vision
7
  - generated_from_trainer
8
  metrics:
9
  - accuracy
10
  model-index:
11
+ - name: "DeiT-base-DatasetDict({\n train: Dataset({\n features: ['img',\
12
+ \ 'fine_label', 'coarse_label'],\n num_rows: 50000\n })\n test: Dataset({\n\
13
+ \ features: ['img', 'fine_label', 'coarse_label'],\n num_rows: 10000\n\
14
+ \ })\n validation: Dataset({\n features: ['img', 'fine_label', 'coarse_label'],\n\
15
+ \ num_rows: 10000\n })\n})"
16
  results: []
17
  ---
18
 
19
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
20
  should probably proofread and complete it, then remove this comment. -->
21
 
22
+ # DeiT-base-DatasetDict({
23
+ train: Dataset({
24
+ features: ['img', 'fine_label', 'coarse_label'],
25
+ num_rows: 50000
26
+ })
27
+ test: Dataset({
28
+ features: ['img', 'fine_label', 'coarse_label'],
29
+ num_rows: 10000
30
+ })
31
+ validation: Dataset({
32
+ features: ['img', 'fine_label', 'coarse_label'],
33
+ num_rows: 10000
34
+ })
35
+ })
36
+
37
+ This model is a fine-tuned version of [facebook/deit-base-distilled-patch16-224](https://huggingface.co/facebook/deit-base-distilled-patch16-224) on the cifar100 dataset.
38
  It achieves the following results on the evaluation set:
 
39
  - Loss: 0.3054
40
+ - Accuracy: 0.906
41
 
42
  ## Model description
43
 
all_results.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.906,
4
  "eval_loss": 0.3053509294986725,
5
- "eval_runtime": 173.1395,
6
- "eval_samples_per_second": 57.757,
7
- "eval_steps_per_second": 57.757,
8
  "total_flos": 3.8815447523328e+19,
9
  "train_loss": 0.0,
10
- "train_runtime": 24.522,
11
- "train_samples_per_second": 20389.834,
12
- "train_steps_per_second": 318.897
13
  }
 
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.906,
4
  "eval_loss": 0.3053509294986725,
5
+ "eval_runtime": 175.7662,
6
+ "eval_samples_per_second": 56.894,
7
+ "eval_steps_per_second": 56.894,
8
  "total_flos": 3.8815447523328e+19,
9
  "train_loss": 0.0,
10
+ "train_runtime": 36.1375,
11
+ "train_samples_per_second": 13836.038,
12
+ "train_steps_per_second": 216.396
13
  }
config.json CHANGED
@@ -222,6 +222,7 @@
222
  "num_channels": 3,
223
  "num_hidden_layers": 12,
224
  "patch_size": 16,
 
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
  "transformers_version": "4.38.1"
 
222
  "num_channels": 3,
223
  "num_hidden_layers": 12,
224
  "patch_size": 16,
225
+ "problem_type": "single_label_classification",
226
  "qkv_bias": true,
227
  "torch_dtype": "float32",
228
  "transformers_version": "4.38.1"
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.906,
4
  "eval_loss": 0.3053509294986725,
5
- "eval_runtime": 173.1395,
6
- "eval_samples_per_second": 57.757,
7
- "eval_steps_per_second": 57.757
8
  }
 
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.906,
4
  "eval_loss": 0.3053509294986725,
5
+ "eval_runtime": 175.7662,
6
+ "eval_samples_per_second": 56.894,
7
+ "eval_steps_per_second": 56.894
8
  }
runs/Mar02_14-41-50_04f752329dca/events.out.tfevents.1709390811.04f752329dca.283.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898c1208cdb37723a8396fc5cc641298180de02118c7a73d681bd6295c943afd
3
+ size 411
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 10.0,
3
  "total_flos": 3.8815447523328e+19,
4
  "train_loss": 0.0,
5
- "train_runtime": 24.522,
6
- "train_samples_per_second": 20389.834,
7
- "train_steps_per_second": 318.897
8
  }
 
2
  "epoch": 10.0,
3
  "total_flos": 3.8815447523328e+19,
4
  "train_loss": 0.0,
5
+ "train_runtime": 36.1375,
6
+ "train_samples_per_second": 13836.038,
7
+ "train_steps_per_second": 216.396
8
  }
trainer_state.json CHANGED
@@ -1039,9 +1039,9 @@
1039
  "step": 7820,
1040
  "total_flos": 3.8815447523328e+19,
1041
  "train_loss": 0.0,
1042
- "train_runtime": 24.522,
1043
- "train_samples_per_second": 20389.834,
1044
- "train_steps_per_second": 318.897
1045
  }
1046
  ],
1047
  "logging_steps": 50,
 
1039
  "step": 7820,
1040
  "total_flos": 3.8815447523328e+19,
1041
  "train_loss": 0.0,
1042
+ "train_runtime": 36.1375,
1043
+ "train_samples_per_second": 13836.038,
1044
+ "train_steps_per_second": 216.396
1045
  }
1046
  ],
1047
  "logging_steps": 50,