BuddhikaWeerasinghe commited on
Commit
c5cde79
·
1 Parent(s): 9096044

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.5,
3
- "eval_accuracy": 0.055,
4
- "eval_loss": 4.912134170532227,
5
- "eval_runtime": 45.6456,
6
- "eval_samples_per_second": 4.382,
7
- "eval_steps_per_second": 2.191
8
  }
 
1
  {
2
+ "epoch": 9.1,
3
+ "eval_accuracy": 0.065,
4
+ "eval_loss": 8.357227325439453,
5
+ "eval_runtime": 45.341,
6
+ "eval_samples_per_second": 4.411,
7
+ "eval_steps_per_second": 2.206
8
  }
runs/Jun28_08-08-17_4f5dfca5dd87/events.out.tfevents.1687941883.4f5dfca5dd87.28.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c805bb99dd5e265499088b0f489d2dc4b1b01c069a6d9e241e049b9d915c39fd
3
- size 411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b5ede4cfcdc7a299a6bb8188ca2ee203c84ba3a79448cc7a5ed87737e4a0e71
3
+ size 734
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.5,
3
- "eval_accuracy": 0.055,
4
- "eval_loss": 4.912134170532227,
5
- "eval_runtime": 45.6456,
6
- "eval_samples_per_second": 4.382,
7
- "eval_steps_per_second": 2.191
8
  }
 
1
  {
2
+ "epoch": 9.1,
3
+ "eval_accuracy": 0.065,
4
+ "eval_loss": 8.357227325439453,
5
+ "eval_runtime": 45.341,
6
+ "eval_samples_per_second": 4.411,
7
+ "eval_steps_per_second": 2.206
8
  }
trainer_state.json CHANGED
@@ -1,79 +1,241 @@
1
  {
2
- "best_metric": 0.822429906542056,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset-buddhika-weerasinghe/checkpoint-360",
4
- "epoch": 1.5,
5
- "global_step": 360,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.28,
12
- "learning_rate": 4.012345679012346e-05,
13
- "loss": 2.2265,
14
  "step": 100
15
  },
16
  {
17
- "epoch": 0.5,
18
- "eval_accuracy": 0.719626168224299,
19
- "eval_loss": 1.0680640935897827,
20
- "eval_runtime": 25.2225,
21
- "eval_samples_per_second": 4.242,
22
- "eval_steps_per_second": 2.141,
23
  "step": 180
24
  },
25
  {
26
- "epoch": 1.06,
27
- "learning_rate": 2.4691358024691357e-05,
28
- "loss": 1.3376,
29
  "step": 200
30
  },
31
  {
32
- "epoch": 1.33,
33
- "learning_rate": 9.259259259259259e-06,
34
- "loss": 0.5234,
35
  "step": 300
36
  },
37
  {
38
- "epoch": 1.5,
39
- "eval_accuracy": 0.822429906542056,
40
- "eval_loss": 0.4782926142215729,
41
- "eval_runtime": 25.0552,
42
- "eval_samples_per_second": 4.271,
43
- "eval_steps_per_second": 2.155,
44
  "step": 360
45
  },
46
  {
47
- "epoch": 1.5,
48
- "step": 360,
49
- "total_flos": 8.972465149889741e+17,
50
- "train_loss": 1.1890253172980414,
51
- "train_runtime": 471.6798,
52
- "train_samples_per_second": 1.526,
53
- "train_steps_per_second": 0.763
54
  },
55
  {
56
- "epoch": 1.5,
57
- "eval_accuracy": 0.055,
58
- "eval_loss": 4.912134170532227,
59
- "eval_runtime": 47.46,
60
- "eval_samples_per_second": 4.214,
61
- "eval_steps_per_second": 2.107,
62
- "step": 360
63
  },
64
  {
65
- "epoch": 1.5,
66
- "eval_accuracy": 0.055,
67
- "eval_loss": 4.912134170532227,
68
- "eval_runtime": 45.6456,
69
- "eval_samples_per_second": 4.382,
70
- "eval_steps_per_second": 2.191,
71
- "step": 360
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
72
  }
73
  ],
74
- "max_steps": 360,
75
  "num_train_epochs": 9223372036854775807,
76
- "total_flos": 8.972465149889741e+17,
77
  "trial_name": null,
78
  "trial_params": null
79
  }
 
1
  {
2
+ "best_metric": 0.9532710280373832,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset-buddhika-weerasinghe/checkpoint-1800",
4
+ "epoch": 9.1,
5
+ "global_step": 1800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.06,
12
+ "learning_rate": 2.777777777777778e-05,
13
+ "loss": 2.4197,
14
  "step": 100
15
  },
16
  {
17
+ "epoch": 0.1,
18
+ "eval_accuracy": 0.5327102803738317,
19
+ "eval_loss": 1.6377586126327515,
20
+ "eval_runtime": 24.7176,
21
+ "eval_samples_per_second": 4.329,
22
+ "eval_steps_per_second": 2.185,
23
  "step": 180
24
  },
25
  {
26
+ "epoch": 1.01,
27
+ "learning_rate": 4.938271604938271e-05,
28
+ "loss": 1.8361,
29
  "step": 200
30
  },
31
  {
32
+ "epoch": 1.07,
33
+ "learning_rate": 4.62962962962963e-05,
34
+ "loss": 0.8573,
35
  "step": 300
36
  },
37
  {
38
+ "epoch": 1.1,
39
+ "eval_accuracy": 0.8411214953271028,
40
+ "eval_loss": 0.6645746827125549,
41
+ "eval_runtime": 25.158,
42
+ "eval_samples_per_second": 4.253,
43
+ "eval_steps_per_second": 2.146,
44
  "step": 360
45
  },
46
  {
47
+ "epoch": 2.02,
48
+ "learning_rate": 4.3209876543209875e-05,
49
+ "loss": 0.5808,
50
+ "step": 400
 
 
 
51
  },
52
  {
53
+ "epoch": 2.08,
54
+ "learning_rate": 4.012345679012346e-05,
55
+ "loss": 0.3788,
56
+ "step": 500
 
 
 
57
  },
58
  {
59
+ "epoch": 2.1,
60
+ "eval_accuracy": 0.8691588785046729,
61
+ "eval_loss": 0.47293204069137573,
62
+ "eval_runtime": 24.7596,
63
+ "eval_samples_per_second": 4.322,
64
+ "eval_steps_per_second": 2.181,
65
+ "step": 540
66
+ },
67
+ {
68
+ "epoch": 3.03,
69
+ "learning_rate": 3.7037037037037037e-05,
70
+ "loss": 0.3202,
71
+ "step": 600
72
+ },
73
+ {
74
+ "epoch": 3.09,
75
+ "learning_rate": 3.395061728395062e-05,
76
+ "loss": 0.3128,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 3.1,
81
+ "eval_accuracy": 0.8785046728971962,
82
+ "eval_loss": 0.4594048857688904,
83
+ "eval_runtime": 24.6582,
84
+ "eval_samples_per_second": 4.339,
85
+ "eval_steps_per_second": 2.19,
86
+ "step": 720
87
+ },
88
+ {
89
+ "epoch": 4.04,
90
+ "learning_rate": 3.08641975308642e-05,
91
+ "loss": 0.1997,
92
+ "step": 800
93
+ },
94
+ {
95
+ "epoch": 4.1,
96
+ "learning_rate": 2.777777777777778e-05,
97
+ "loss": 0.1661,
98
+ "step": 900
99
+ },
100
+ {
101
+ "epoch": 4.1,
102
+ "eval_accuracy": 0.8317757009345794,
103
+ "eval_loss": 0.5953821539878845,
104
+ "eval_runtime": 24.4322,
105
+ "eval_samples_per_second": 4.379,
106
+ "eval_steps_per_second": 2.21,
107
+ "step": 900
108
+ },
109
+ {
110
+ "epoch": 5.06,
111
+ "learning_rate": 2.4691358024691357e-05,
112
+ "loss": 0.1321,
113
+ "step": 1000
114
+ },
115
+ {
116
+ "epoch": 5.1,
117
+ "eval_accuracy": 0.9345794392523364,
118
+ "eval_loss": 0.19723989069461823,
119
+ "eval_runtime": 24.5315,
120
+ "eval_samples_per_second": 4.362,
121
+ "eval_steps_per_second": 2.201,
122
+ "step": 1080
123
+ },
124
+ {
125
+ "epoch": 6.01,
126
+ "learning_rate": 2.1604938271604937e-05,
127
+ "loss": 0.0066,
128
+ "step": 1100
129
+ },
130
+ {
131
+ "epoch": 6.07,
132
+ "learning_rate": 1.8518518518518518e-05,
133
+ "loss": 0.0602,
134
+ "step": 1200
135
+ },
136
+ {
137
+ "epoch": 6.1,
138
+ "eval_accuracy": 0.9252336448598131,
139
+ "eval_loss": 0.3471812903881073,
140
+ "eval_runtime": 24.5462,
141
+ "eval_samples_per_second": 4.359,
142
+ "eval_steps_per_second": 2.2,
143
+ "step": 1260
144
+ },
145
+ {
146
+ "epoch": 7.02,
147
+ "learning_rate": 1.54320987654321e-05,
148
+ "loss": 0.0025,
149
+ "step": 1300
150
+ },
151
+ {
152
+ "epoch": 7.08,
153
+ "learning_rate": 1.2345679012345678e-05,
154
+ "loss": 0.0269,
155
+ "step": 1400
156
+ },
157
+ {
158
+ "epoch": 7.1,
159
+ "eval_accuracy": 0.9252336448598131,
160
+ "eval_loss": 0.3087226152420044,
161
+ "eval_runtime": 24.5511,
162
+ "eval_samples_per_second": 4.358,
163
+ "eval_steps_per_second": 2.199,
164
+ "step": 1440
165
+ },
166
+ {
167
+ "epoch": 8.03,
168
+ "learning_rate": 9.259259259259259e-06,
169
+ "loss": 0.0116,
170
+ "step": 1500
171
+ },
172
+ {
173
+ "epoch": 8.09,
174
+ "learning_rate": 6.172839506172839e-06,
175
+ "loss": 0.0058,
176
+ "step": 1600
177
+ },
178
+ {
179
+ "epoch": 8.1,
180
+ "eval_accuracy": 0.9439252336448598,
181
+ "eval_loss": 0.31687241792678833,
182
+ "eval_runtime": 24.5581,
183
+ "eval_samples_per_second": 4.357,
184
+ "eval_steps_per_second": 2.199,
185
+ "step": 1620
186
+ },
187
+ {
188
+ "epoch": 9.04,
189
+ "learning_rate": 3.0864197530864196e-06,
190
+ "loss": 0.0029,
191
+ "step": 1700
192
+ },
193
+ {
194
+ "epoch": 9.1,
195
+ "learning_rate": 0.0,
196
+ "loss": 0.0061,
197
+ "step": 1800
198
+ },
199
+ {
200
+ "epoch": 9.1,
201
+ "eval_accuracy": 0.9532710280373832,
202
+ "eval_loss": 0.2525083124637604,
203
+ "eval_runtime": 24.7778,
204
+ "eval_samples_per_second": 4.318,
205
+ "eval_steps_per_second": 2.179,
206
+ "step": 1800
207
+ },
208
+ {
209
+ "epoch": 9.1,
210
+ "step": 1800,
211
+ "total_flos": 4.4862325749448704e+18,
212
+ "train_loss": 0.40701433156927425,
213
+ "train_runtime": 1997.2528,
214
+ "train_samples_per_second": 1.802,
215
+ "train_steps_per_second": 0.901
216
+ },
217
+ {
218
+ "epoch": 9.1,
219
+ "eval_accuracy": 0.065,
220
+ "eval_loss": 8.357227325439453,
221
+ "eval_runtime": 46.1165,
222
+ "eval_samples_per_second": 4.337,
223
+ "eval_steps_per_second": 2.168,
224
+ "step": 1800
225
+ },
226
+ {
227
+ "epoch": 9.1,
228
+ "eval_accuracy": 0.065,
229
+ "eval_loss": 8.357227325439453,
230
+ "eval_runtime": 45.341,
231
+ "eval_samples_per_second": 4.411,
232
+ "eval_steps_per_second": 2.206,
233
+ "step": 1800
234
  }
235
  ],
236
+ "max_steps": 1800,
237
  "num_train_epochs": 9223372036854775807,
238
+ "total_flos": 4.4862325749448704e+18,
239
  "trial_name": null,
240
  "trial_params": null
241
  }