tdhcuong committed on
Commit
7eca599
·
verified ·
1 Parent(s): f5e3be8

End of training

Browse files
Files changed (5) hide show
  1. README.md +3 -3
  2. all_results.json +13 -0
  3. eval_results.json +8 -0
  4. train_results.json +8 -0
  5. trainer_state.json +227 -0
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.8984509466437177
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [microsoft/swin-tiny-patch4-window7-224](https://huggingface.co/microsoft/swin-tiny-patch4-window7-224) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.2464
37
- - Accuracy: 0.8985
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.9139414802065404
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [microsoft/swin-tiny-patch4-window7-224](https://huggingface.co/microsoft/swin-tiny-patch4-window7-224) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.2522
37
+ - Accuracy: 0.9139
38
 
39
  ## Model description
40
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.9139414802065404,
4
+ "eval_loss": 0.2521795928478241,
5
+ "eval_runtime": 26.164,
6
+ "eval_samples_per_second": 22.206,
7
+ "eval_steps_per_second": 0.726,
8
+ "total_flos": 6.487956947146752e+17,
9
+ "train_loss": 0.36339920555672994,
10
+ "train_runtime": 1344.0908,
11
+ "train_samples_per_second": 19.418,
12
+ "train_steps_per_second": 0.153
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.9139414802065404,
4
+ "eval_loss": 0.2521795928478241,
5
+ "eval_runtime": 26.164,
6
+ "eval_samples_per_second": 22.206,
7
+ "eval_steps_per_second": 0.726
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 6.487956947146752e+17,
4
+ "train_loss": 0.36339920555672994,
5
+ "train_runtime": 1344.0908,
6
+ "train_samples_per_second": 19.418,
7
+ "train_steps_per_second": 0.153
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,227 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9139414802065404,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-azure-poc-img-classification/checkpoint-123",
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 205,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.24390243902439024,
13
+ "grad_norm": 69.68915557861328,
14
+ "learning_rate": 2.380952380952381e-05,
15
+ "loss": 1.5545,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.4878048780487805,
20
+ "grad_norm": 46.480247497558594,
21
+ "learning_rate": 4.761904761904762e-05,
22
+ "loss": 0.8946,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.7317073170731707,
27
+ "grad_norm": 28.4664363861084,
28
+ "learning_rate": 4.7554347826086956e-05,
29
+ "loss": 0.5093,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.975609756097561,
34
+ "grad_norm": 26.042448043823242,
35
+ "learning_rate": 4.483695652173913e-05,
36
+ "loss": 0.4227,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 1.0,
41
+ "eval_accuracy": 0.8898450946643718,
42
+ "eval_loss": 0.3245888352394104,
43
+ "eval_runtime": 28.5684,
44
+ "eval_samples_per_second": 20.337,
45
+ "eval_steps_per_second": 0.665,
46
+ "step": 41
47
+ },
48
+ {
49
+ "epoch": 1.2195121951219512,
50
+ "grad_norm": 30.95467758178711,
51
+ "learning_rate": 4.2119565217391304e-05,
52
+ "loss": 0.3611,
53
+ "step": 50
54
+ },
55
+ {
56
+ "epoch": 1.4634146341463414,
57
+ "grad_norm": 15.45040225982666,
58
+ "learning_rate": 3.940217391304348e-05,
59
+ "loss": 0.3267,
60
+ "step": 60
61
+ },
62
+ {
63
+ "epoch": 1.7073170731707317,
64
+ "grad_norm": 17.348590850830078,
65
+ "learning_rate": 3.668478260869566e-05,
66
+ "loss": 0.3091,
67
+ "step": 70
68
+ },
69
+ {
70
+ "epoch": 1.951219512195122,
71
+ "grad_norm": 17.025691986083984,
72
+ "learning_rate": 3.3967391304347826e-05,
73
+ "loss": 0.3169,
74
+ "step": 80
75
+ },
76
+ {
77
+ "epoch": 2.0,
78
+ "eval_accuracy": 0.8950086058519794,
79
+ "eval_loss": 0.27360019087791443,
80
+ "eval_runtime": 25.8613,
81
+ "eval_samples_per_second": 22.466,
82
+ "eval_steps_per_second": 0.735,
83
+ "step": 82
84
+ },
85
+ {
86
+ "epoch": 2.1951219512195124,
87
+ "grad_norm": 14.608966827392578,
88
+ "learning_rate": 3.125e-05,
89
+ "loss": 0.2459,
90
+ "step": 90
91
+ },
92
+ {
93
+ "epoch": 2.4390243902439024,
94
+ "grad_norm": 15.097740173339844,
95
+ "learning_rate": 2.8532608695652175e-05,
96
+ "loss": 0.2455,
97
+ "step": 100
98
+ },
99
+ {
100
+ "epoch": 2.682926829268293,
101
+ "grad_norm": 16.881877899169922,
102
+ "learning_rate": 2.5815217391304346e-05,
103
+ "loss": 0.2439,
104
+ "step": 110
105
+ },
106
+ {
107
+ "epoch": 2.926829268292683,
108
+ "grad_norm": 17.772117614746094,
109
+ "learning_rate": 2.3097826086956523e-05,
110
+ "loss": 0.2632,
111
+ "step": 120
112
+ },
113
+ {
114
+ "epoch": 3.0,
115
+ "eval_accuracy": 0.9139414802065404,
116
+ "eval_loss": 0.2521795928478241,
117
+ "eval_runtime": 27.019,
118
+ "eval_samples_per_second": 21.503,
119
+ "eval_steps_per_second": 0.703,
120
+ "step": 123
121
+ },
122
+ {
123
+ "epoch": 3.1707317073170733,
124
+ "grad_norm": 16.634872436523438,
125
+ "learning_rate": 2.0380434782608694e-05,
126
+ "loss": 0.2085,
127
+ "step": 130
128
+ },
129
+ {
130
+ "epoch": 3.4146341463414633,
131
+ "grad_norm": 25.425128936767578,
132
+ "learning_rate": 1.766304347826087e-05,
133
+ "loss": 0.2293,
134
+ "step": 140
135
+ },
136
+ {
137
+ "epoch": 3.658536585365854,
138
+ "grad_norm": 9.363799095153809,
139
+ "learning_rate": 1.4945652173913044e-05,
140
+ "loss": 0.2041,
141
+ "step": 150
142
+ },
143
+ {
144
+ "epoch": 3.902439024390244,
145
+ "grad_norm": 8.764758110046387,
146
+ "learning_rate": 1.2228260869565218e-05,
147
+ "loss": 0.2034,
148
+ "step": 160
149
+ },
150
+ {
151
+ "epoch": 4.0,
152
+ "eval_accuracy": 0.8984509466437177,
153
+ "eval_loss": 0.24487625062465668,
154
+ "eval_runtime": 25.7575,
155
+ "eval_samples_per_second": 22.557,
156
+ "eval_steps_per_second": 0.738,
157
+ "step": 164
158
+ },
159
+ {
160
+ "epoch": 4.146341463414634,
161
+ "grad_norm": 11.34645938873291,
162
+ "learning_rate": 9.510869565217392e-06,
163
+ "loss": 0.224,
164
+ "step": 170
165
+ },
166
+ {
167
+ "epoch": 4.390243902439025,
168
+ "grad_norm": 16.645652770996094,
169
+ "learning_rate": 6.7934782608695655e-06,
170
+ "loss": 0.1933,
171
+ "step": 180
172
+ },
173
+ {
174
+ "epoch": 4.634146341463414,
175
+ "grad_norm": 12.6370267868042,
176
+ "learning_rate": 4.07608695652174e-06,
177
+ "loss": 0.1932,
178
+ "step": 190
179
+ },
180
+ {
181
+ "epoch": 4.878048780487805,
182
+ "grad_norm": 20.207782745361328,
183
+ "learning_rate": 1.3586956521739131e-06,
184
+ "loss": 0.1984,
185
+ "step": 200
186
+ },
187
+ {
188
+ "epoch": 5.0,
189
+ "eval_accuracy": 0.8984509466437177,
190
+ "eval_loss": 0.24636875092983246,
191
+ "eval_runtime": 27.2859,
192
+ "eval_samples_per_second": 21.293,
193
+ "eval_steps_per_second": 0.696,
194
+ "step": 205
195
+ },
196
+ {
197
+ "epoch": 5.0,
198
+ "step": 205,
199
+ "total_flos": 6.487956947146752e+17,
200
+ "train_loss": 0.36339920555672994,
201
+ "train_runtime": 1344.0908,
202
+ "train_samples_per_second": 19.418,
203
+ "train_steps_per_second": 0.153
204
+ }
205
+ ],
206
+ "logging_steps": 10,
207
+ "max_steps": 205,
208
+ "num_input_tokens_seen": 0,
209
+ "num_train_epochs": 5,
210
+ "save_steps": 500,
211
+ "stateful_callbacks": {
212
+ "TrainerControl": {
213
+ "args": {
214
+ "should_epoch_stop": false,
215
+ "should_evaluate": false,
216
+ "should_log": false,
217
+ "should_save": true,
218
+ "should_training_stop": true
219
+ },
220
+ "attributes": {}
221
+ }
222
+ },
223
+ "total_flos": 6.487956947146752e+17,
224
+ "train_batch_size": 32,
225
+ "trial_name": null,
226
+ "trial_params": null
227
+ }