zen45 commited on
Commit
025177d
·
verified ·
1 Parent(s): 9aa0f61

End of training

Browse files
Files changed (5) hide show
  1. README.md +3 -3
  2. all_results.json +13 -0
  3. eval_results.json +8 -0
  4. train_results.json +8 -0
  5. trainer_state.json +229 -0
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7614213197969543
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 1.3081
36
- - Accuracy: 0.7614
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7715736040609137
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 1.1390
36
+ - Accuracy: 0.7716
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.7715736040609137,
4
+ "eval_loss": 1.139024019241333,
5
+ "eval_runtime": 26.9374,
6
+ "eval_samples_per_second": 14.627,
7
+ "eval_steps_per_second": 0.928,
8
+ "total_flos": 1.1242852922068992e+18,
9
+ "train_loss": 0.37599817170037164,
10
+ "train_runtime": 5634.9759,
11
+ "train_samples_per_second": 2.547,
12
+ "train_steps_per_second": 0.04
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.7715736040609137,
4
+ "eval_loss": 1.139024019241333,
5
+ "eval_runtime": 26.9374,
6
+ "eval_samples_per_second": 14.627,
7
+ "eval_steps_per_second": 0.928
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 1.1242852922068992e+18,
4
+ "train_loss": 0.37599817170037164,
5
+ "train_runtime": 5634.9759,
6
+ "train_samples_per_second": 2.547,
7
+ "train_steps_per_second": 0.04
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,229 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.7715736040609137,
3
+ "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-finetuned-CT\\checkpoint-180",
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 225,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.2222222222222222,
13
+ "grad_norm": 4.816601276397705,
14
+ "learning_rate": 1.3043478260869566e-05,
15
+ "loss": 1.515,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.4444444444444444,
20
+ "grad_norm": 4.57719087600708,
21
+ "learning_rate": 2.608695652173913e-05,
22
+ "loss": 1.2094,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.6666666666666666,
27
+ "grad_norm": 22.845544815063477,
28
+ "learning_rate": 2.896039603960396e-05,
29
+ "loss": 0.8499,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.8888888888888888,
34
+ "grad_norm": 22.14103126525879,
35
+ "learning_rate": 2.747524752475248e-05,
36
+ "loss": 0.5901,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 1.0,
41
+ "eval_accuracy": 0.5685279187817259,
42
+ "eval_loss": 1.2601628303527832,
43
+ "eval_runtime": 25.1222,
44
+ "eval_samples_per_second": 15.683,
45
+ "eval_steps_per_second": 0.995,
46
+ "step": 45
47
+ },
48
+ {
49
+ "epoch": 1.1111111111111112,
50
+ "grad_norm": 13.752126693725586,
51
+ "learning_rate": 2.599009900990099e-05,
52
+ "loss": 0.4871,
53
+ "step": 50
54
+ },
55
+ {
56
+ "epoch": 1.3333333333333333,
57
+ "grad_norm": 20.15511131286621,
58
+ "learning_rate": 2.4504950495049504e-05,
59
+ "loss": 0.375,
60
+ "step": 60
61
+ },
62
+ {
63
+ "epoch": 1.5555555555555556,
64
+ "grad_norm": 7.8009490966796875,
65
+ "learning_rate": 2.301980198019802e-05,
66
+ "loss": 0.333,
67
+ "step": 70
68
+ },
69
+ {
70
+ "epoch": 1.7777777777777777,
71
+ "grad_norm": 6.6323957443237305,
72
+ "learning_rate": 2.1534653465346535e-05,
73
+ "loss": 0.2945,
74
+ "step": 80
75
+ },
76
+ {
77
+ "epoch": 2.0,
78
+ "grad_norm": 4.815214157104492,
79
+ "learning_rate": 2.004950495049505e-05,
80
+ "loss": 0.2771,
81
+ "step": 90
82
+ },
83
+ {
84
+ "epoch": 2.0,
85
+ "eval_accuracy": 0.7106598984771574,
86
+ "eval_loss": 1.1592636108398438,
87
+ "eval_runtime": 26.3129,
88
+ "eval_samples_per_second": 14.974,
89
+ "eval_steps_per_second": 0.95,
90
+ "step": 90
91
+ },
92
+ {
93
+ "epoch": 2.2222222222222223,
94
+ "grad_norm": 7.441839694976807,
95
+ "learning_rate": 1.8564356435643564e-05,
96
+ "loss": 0.2747,
97
+ "step": 100
98
+ },
99
+ {
100
+ "epoch": 2.4444444444444446,
101
+ "grad_norm": 16.264951705932617,
102
+ "learning_rate": 1.7079207920792078e-05,
103
+ "loss": 0.2465,
104
+ "step": 110
105
+ },
106
+ {
107
+ "epoch": 2.6666666666666665,
108
+ "grad_norm": 51.40734100341797,
109
+ "learning_rate": 1.5594059405940596e-05,
110
+ "loss": 0.2113,
111
+ "step": 120
112
+ },
113
+ {
114
+ "epoch": 2.888888888888889,
115
+ "grad_norm": 9.421001434326172,
116
+ "learning_rate": 1.4108910891089108e-05,
117
+ "loss": 0.2341,
118
+ "step": 130
119
+ },
120
+ {
121
+ "epoch": 3.0,
122
+ "eval_accuracy": 0.7233502538071066,
123
+ "eval_loss": 1.2320008277893066,
124
+ "eval_runtime": 25.3627,
125
+ "eval_samples_per_second": 15.535,
126
+ "eval_steps_per_second": 0.986,
127
+ "step": 135
128
+ },
129
+ {
130
+ "epoch": 3.111111111111111,
131
+ "grad_norm": 4.912576675415039,
132
+ "learning_rate": 1.2623762376237624e-05,
133
+ "loss": 0.2227,
134
+ "step": 140
135
+ },
136
+ {
137
+ "epoch": 3.3333333333333335,
138
+ "grad_norm": 35.091007232666016,
139
+ "learning_rate": 1.1138613861386138e-05,
140
+ "loss": 0.1684,
141
+ "step": 150
142
+ },
143
+ {
144
+ "epoch": 3.5555555555555554,
145
+ "grad_norm": 7.606155872344971,
146
+ "learning_rate": 9.653465346534654e-06,
147
+ "loss": 0.1606,
148
+ "step": 160
149
+ },
150
+ {
151
+ "epoch": 3.7777777777777777,
152
+ "grad_norm": 8.227788925170898,
153
+ "learning_rate": 8.168316831683168e-06,
154
+ "loss": 0.1323,
155
+ "step": 170
156
+ },
157
+ {
158
+ "epoch": 4.0,
159
+ "grad_norm": 9.39113712310791,
160
+ "learning_rate": 6.6831683168316835e-06,
161
+ "loss": 0.1879,
162
+ "step": 180
163
+ },
164
+ {
165
+ "epoch": 4.0,
166
+ "eval_accuracy": 0.7715736040609137,
167
+ "eval_loss": 1.139024019241333,
168
+ "eval_runtime": 25.2262,
169
+ "eval_samples_per_second": 15.619,
170
+ "eval_steps_per_second": 0.991,
171
+ "step": 180
172
+ },
173
+ {
174
+ "epoch": 4.222222222222222,
175
+ "grad_norm": 8.584113121032715,
176
+ "learning_rate": 5.198019801980198e-06,
177
+ "loss": 0.1653,
178
+ "step": 190
179
+ },
180
+ {
181
+ "epoch": 4.444444444444445,
182
+ "grad_norm": 9.124540328979492,
183
+ "learning_rate": 3.7128712871287128e-06,
184
+ "loss": 0.1394,
185
+ "step": 200
186
+ },
187
+ {
188
+ "epoch": 4.666666666666667,
189
+ "grad_norm": 6.846659183502197,
190
+ "learning_rate": 2.227722772277228e-06,
191
+ "loss": 0.1275,
192
+ "step": 210
193
+ },
194
+ {
195
+ "epoch": 4.888888888888889,
196
+ "grad_norm": 9.12004280090332,
197
+ "learning_rate": 7.425742574257426e-07,
198
+ "loss": 0.1765,
199
+ "step": 220
200
+ },
201
+ {
202
+ "epoch": 5.0,
203
+ "eval_accuracy": 0.7614213197969543,
204
+ "eval_loss": 1.3080726861953735,
205
+ "eval_runtime": 27.2127,
206
+ "eval_samples_per_second": 14.479,
207
+ "eval_steps_per_second": 0.919,
208
+ "step": 225
209
+ },
210
+ {
211
+ "epoch": 5.0,
212
+ "step": 225,
213
+ "total_flos": 1.1242852922068992e+18,
214
+ "train_loss": 0.37599817170037164,
215
+ "train_runtime": 5634.9759,
216
+ "train_samples_per_second": 2.547,
217
+ "train_steps_per_second": 0.04
218
+ }
219
+ ],
220
+ "logging_steps": 10,
221
+ "max_steps": 225,
222
+ "num_input_tokens_seen": 0,
223
+ "num_train_epochs": 5,
224
+ "save_steps": 500,
225
+ "total_flos": 1.1242852922068992e+18,
226
+ "train_batch_size": 16,
227
+ "trial_name": null,
228
+ "trial_params": null
229
+ }