BuddhikaWeerasinghe commited on
Commit
31042ef
·
1 Parent(s): ae90098

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 9.1,
3
- "eval_accuracy": 0.065,
4
- "eval_loss": 8.357227325439453,
5
- "eval_runtime": 45.341,
6
- "eval_samples_per_second": 4.411,
7
- "eval_steps_per_second": 2.206
8
  }
 
1
  {
2
  "epoch": 9.1,
3
+ "eval_accuracy": 0.0,
4
+ "eval_loss": 8.188952445983887,
5
+ "eval_runtime": 1.8553,
6
+ "eval_samples_per_second": 4.312,
7
+ "eval_steps_per_second": 2.156
8
  }
runs/Jun28_09-15-43_d7d6e6a71cfc/events.out.tfevents.1687946329.d7d6e6a71cfc.28.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:323dc234232021dc460a19c80045cc381d6c5f5a9973896c61f45878336236d5
3
- size 411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cd3cd6364c6ed1920e7374bc0c1813d79bd0694e7a123be68d41a3227e27e6a
3
+ size 734
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 9.1,
3
- "eval_accuracy": 0.065,
4
- "eval_loss": 8.357227325439453,
5
- "eval_runtime": 45.341,
6
- "eval_samples_per_second": 4.411,
7
- "eval_steps_per_second": 2.206
8
  }
 
1
  {
2
  "epoch": 9.1,
3
+ "eval_accuracy": 0.0,
4
+ "eval_loss": 8.188952445983887,
5
+ "eval_runtime": 1.8553,
6
+ "eval_samples_per_second": 4.312,
7
+ "eval_steps_per_second": 2.156
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9532710280373832,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset-buddhika-weerasinghe/checkpoint-1800",
4
  "epoch": 9.1,
5
  "global_step": 1800,
6
  "is_hyper_param_search": false,
@@ -10,198 +10,198 @@
10
  {
11
  "epoch": 0.06,
12
  "learning_rate": 2.777777777777778e-05,
13
- "loss": 2.4197,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.1,
18
- "eval_accuracy": 0.5327102803738317,
19
- "eval_loss": 1.6377586126327515,
20
- "eval_runtime": 24.7176,
21
- "eval_samples_per_second": 4.329,
22
- "eval_steps_per_second": 2.185,
23
  "step": 180
24
  },
25
  {
26
  "epoch": 1.01,
27
  "learning_rate": 4.938271604938271e-05,
28
- "loss": 1.8361,
29
  "step": 200
30
  },
31
  {
32
  "epoch": 1.07,
33
  "learning_rate": 4.62962962962963e-05,
34
- "loss": 0.8573,
35
  "step": 300
36
  },
37
  {
38
  "epoch": 1.1,
39
- "eval_accuracy": 0.8411214953271028,
40
- "eval_loss": 0.6645746827125549,
41
- "eval_runtime": 25.158,
42
- "eval_samples_per_second": 4.253,
43
- "eval_steps_per_second": 2.146,
44
  "step": 360
45
  },
46
  {
47
  "epoch": 2.02,
48
  "learning_rate": 4.3209876543209875e-05,
49
- "loss": 0.5808,
50
  "step": 400
51
  },
52
  {
53
  "epoch": 2.08,
54
  "learning_rate": 4.012345679012346e-05,
55
- "loss": 0.3788,
56
  "step": 500
57
  },
58
  {
59
  "epoch": 2.1,
60
- "eval_accuracy": 0.8691588785046729,
61
- "eval_loss": 0.47293204069137573,
62
- "eval_runtime": 24.7596,
63
- "eval_samples_per_second": 4.322,
64
- "eval_steps_per_second": 2.181,
65
  "step": 540
66
  },
67
  {
68
  "epoch": 3.03,
69
  "learning_rate": 3.7037037037037037e-05,
70
- "loss": 0.3202,
71
  "step": 600
72
  },
73
  {
74
  "epoch": 3.09,
75
  "learning_rate": 3.395061728395062e-05,
76
- "loss": 0.3128,
77
  "step": 700
78
  },
79
  {
80
  "epoch": 3.1,
81
- "eval_accuracy": 0.8785046728971962,
82
- "eval_loss": 0.4594048857688904,
83
- "eval_runtime": 24.6582,
84
- "eval_samples_per_second": 4.339,
85
- "eval_steps_per_second": 2.19,
86
  "step": 720
87
  },
88
  {
89
  "epoch": 4.04,
90
  "learning_rate": 3.08641975308642e-05,
91
- "loss": 0.1997,
92
  "step": 800
93
  },
94
  {
95
  "epoch": 4.1,
96
  "learning_rate": 2.777777777777778e-05,
97
- "loss": 0.1661,
98
  "step": 900
99
  },
100
  {
101
  "epoch": 4.1,
102
- "eval_accuracy": 0.8317757009345794,
103
- "eval_loss": 0.5953821539878845,
104
- "eval_runtime": 24.4322,
105
- "eval_samples_per_second": 4.379,
106
- "eval_steps_per_second": 2.21,
107
  "step": 900
108
  },
109
  {
110
  "epoch": 5.06,
111
  "learning_rate": 2.4691358024691357e-05,
112
- "loss": 0.1321,
113
  "step": 1000
114
  },
115
  {
116
  "epoch": 5.1,
117
- "eval_accuracy": 0.9345794392523364,
118
- "eval_loss": 0.19723989069461823,
119
- "eval_runtime": 24.5315,
120
- "eval_samples_per_second": 4.362,
121
- "eval_steps_per_second": 2.201,
122
  "step": 1080
123
  },
124
  {
125
  "epoch": 6.01,
126
  "learning_rate": 2.1604938271604937e-05,
127
- "loss": 0.0066,
128
  "step": 1100
129
  },
130
  {
131
  "epoch": 6.07,
132
  "learning_rate": 1.8518518518518518e-05,
133
- "loss": 0.0602,
134
  "step": 1200
135
  },
136
  {
137
  "epoch": 6.1,
138
- "eval_accuracy": 0.9252336448598131,
139
- "eval_loss": 0.3471812903881073,
140
- "eval_runtime": 24.5462,
141
- "eval_samples_per_second": 4.359,
142
- "eval_steps_per_second": 2.2,
143
  "step": 1260
144
  },
145
  {
146
  "epoch": 7.02,
147
  "learning_rate": 1.54320987654321e-05,
148
- "loss": 0.0025,
149
  "step": 1300
150
  },
151
  {
152
  "epoch": 7.08,
153
  "learning_rate": 1.2345679012345678e-05,
154
- "loss": 0.0269,
155
  "step": 1400
156
  },
157
  {
158
  "epoch": 7.1,
159
- "eval_accuracy": 0.9252336448598131,
160
- "eval_loss": 0.3087226152420044,
161
- "eval_runtime": 24.5511,
162
- "eval_samples_per_second": 4.358,
163
- "eval_steps_per_second": 2.199,
164
  "step": 1440
165
  },
166
  {
167
  "epoch": 8.03,
168
  "learning_rate": 9.259259259259259e-06,
169
- "loss": 0.0116,
170
  "step": 1500
171
  },
172
  {
173
  "epoch": 8.09,
174
  "learning_rate": 6.172839506172839e-06,
175
- "loss": 0.0058,
176
  "step": 1600
177
  },
178
  {
179
  "epoch": 8.1,
180
- "eval_accuracy": 0.9439252336448598,
181
- "eval_loss": 0.31687241792678833,
182
- "eval_runtime": 24.5581,
183
- "eval_samples_per_second": 4.357,
184
- "eval_steps_per_second": 2.199,
185
  "step": 1620
186
  },
187
  {
188
  "epoch": 9.04,
189
  "learning_rate": 3.0864197530864196e-06,
190
- "loss": 0.0029,
191
  "step": 1700
192
  },
193
  {
194
  "epoch": 9.1,
195
  "learning_rate": 0.0,
196
- "loss": 0.0061,
197
  "step": 1800
198
  },
199
  {
200
  "epoch": 9.1,
201
- "eval_accuracy": 0.9532710280373832,
202
- "eval_loss": 0.2525083124637604,
203
- "eval_runtime": 24.7778,
204
- "eval_samples_per_second": 4.318,
205
  "eval_steps_per_second": 2.179,
206
  "step": 1800
207
  },
@@ -209,27 +209,27 @@
209
  "epoch": 9.1,
210
  "step": 1800,
211
  "total_flos": 4.4862325749448704e+18,
212
- "train_loss": 0.40701433156927425,
213
- "train_runtime": 1997.2528,
214
- "train_samples_per_second": 1.802,
215
- "train_steps_per_second": 0.901
216
  },
217
  {
218
  "epoch": 9.1,
219
- "eval_accuracy": 0.065,
220
- "eval_loss": 8.357227325439453,
221
- "eval_runtime": 46.1165,
222
- "eval_samples_per_second": 4.337,
223
- "eval_steps_per_second": 2.168,
224
  "step": 1800
225
  },
226
  {
227
  "epoch": 9.1,
228
- "eval_accuracy": 0.065,
229
- "eval_loss": 8.357227325439453,
230
- "eval_runtime": 45.341,
231
- "eval_samples_per_second": 4.411,
232
- "eval_steps_per_second": 2.206,
233
  "step": 1800
234
  }
235
  ],
 
1
  {
2
+ "best_metric": 0.9763313609467456,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset-buddhika-weerasinghe/checkpoint-1620",
4
  "epoch": 9.1,
5
  "global_step": 1800,
6
  "is_hyper_param_search": false,
 
10
  {
11
  "epoch": 0.06,
12
  "learning_rate": 2.777777777777778e-05,
13
+ "loss": 2.4105,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.1,
18
+ "eval_accuracy": 0.46153846153846156,
19
+ "eval_loss": 1.6308622360229492,
20
+ "eval_runtime": 77.3029,
21
+ "eval_samples_per_second": 4.372,
22
+ "eval_steps_per_second": 2.186,
23
  "step": 180
24
  },
25
  {
26
  "epoch": 1.01,
27
  "learning_rate": 4.938271604938271e-05,
28
+ "loss": 1.8958,
29
  "step": 200
30
  },
31
  {
32
  "epoch": 1.07,
33
  "learning_rate": 4.62962962962963e-05,
34
+ "loss": 0.9175,
35
  "step": 300
36
  },
37
  {
38
  "epoch": 1.1,
39
+ "eval_accuracy": 0.878698224852071,
40
+ "eval_loss": 0.4374070167541504,
41
+ "eval_runtime": 78.2783,
42
+ "eval_samples_per_second": 4.318,
43
+ "eval_steps_per_second": 2.159,
44
  "step": 360
45
  },
46
  {
47
  "epoch": 2.02,
48
  "learning_rate": 4.3209876543209875e-05,
49
+ "loss": 0.6119,
50
  "step": 400
51
  },
52
  {
53
  "epoch": 2.08,
54
  "learning_rate": 4.012345679012346e-05,
55
+ "loss": 0.5086,
56
  "step": 500
57
  },
58
  {
59
  "epoch": 2.1,
60
+ "eval_accuracy": 0.8905325443786982,
61
+ "eval_loss": 0.38013187050819397,
62
+ "eval_runtime": 74.0577,
63
+ "eval_samples_per_second": 4.564,
64
+ "eval_steps_per_second": 2.282,
65
  "step": 540
66
  },
67
  {
68
  "epoch": 3.03,
69
  "learning_rate": 3.7037037037037037e-05,
70
+ "loss": 0.4112,
71
  "step": 600
72
  },
73
  {
74
  "epoch": 3.09,
75
  "learning_rate": 3.395061728395062e-05,
76
+ "loss": 0.2994,
77
  "step": 700
78
  },
79
  {
80
  "epoch": 3.1,
81
+ "eval_accuracy": 0.8816568047337278,
82
+ "eval_loss": 0.346200168132782,
83
+ "eval_runtime": 77.9704,
84
+ "eval_samples_per_second": 4.335,
85
+ "eval_steps_per_second": 2.167,
86
  "step": 720
87
  },
88
  {
89
  "epoch": 4.04,
90
  "learning_rate": 3.08641975308642e-05,
91
+ "loss": 0.2183,
92
  "step": 800
93
  },
94
  {
95
  "epoch": 4.1,
96
  "learning_rate": 2.777777777777778e-05,
97
+ "loss": 0.1555,
98
  "step": 900
99
  },
100
  {
101
  "epoch": 4.1,
102
+ "eval_accuracy": 0.9230769230769231,
103
+ "eval_loss": 0.3273673951625824,
104
+ "eval_runtime": 77.1136,
105
+ "eval_samples_per_second": 4.383,
106
+ "eval_steps_per_second": 2.192,
107
  "step": 900
108
  },
109
  {
110
  "epoch": 5.06,
111
  "learning_rate": 2.4691358024691357e-05,
112
+ "loss": 0.1337,
113
  "step": 1000
114
  },
115
  {
116
  "epoch": 5.1,
117
+ "eval_accuracy": 0.9615384615384616,
118
+ "eval_loss": 0.1434585154056549,
119
+ "eval_runtime": 77.4654,
120
+ "eval_samples_per_second": 4.363,
121
+ "eval_steps_per_second": 2.182,
122
  "step": 1080
123
  },
124
  {
125
  "epoch": 6.01,
126
  "learning_rate": 2.1604938271604937e-05,
127
+ "loss": 0.0749,
128
  "step": 1100
129
  },
130
  {
131
  "epoch": 6.07,
132
  "learning_rate": 1.8518518518518518e-05,
133
+ "loss": 0.021,
134
  "step": 1200
135
  },
136
  {
137
  "epoch": 6.1,
138
+ "eval_accuracy": 0.9615384615384616,
139
+ "eval_loss": 0.18787238001823425,
140
+ "eval_runtime": 77.5975,
141
+ "eval_samples_per_second": 4.356,
142
+ "eval_steps_per_second": 2.178,
143
  "step": 1260
144
  },
145
  {
146
  "epoch": 7.02,
147
  "learning_rate": 1.54320987654321e-05,
148
+ "loss": 0.003,
149
  "step": 1300
150
  },
151
  {
152
  "epoch": 7.08,
153
  "learning_rate": 1.2345679012345678e-05,
154
+ "loss": 0.0485,
155
  "step": 1400
156
  },
157
  {
158
  "epoch": 7.1,
159
+ "eval_accuracy": 0.9674556213017751,
160
+ "eval_loss": 0.10547798126935959,
161
+ "eval_runtime": 76.9785,
162
+ "eval_samples_per_second": 4.391,
163
+ "eval_steps_per_second": 2.195,
164
  "step": 1440
165
  },
166
  {
167
  "epoch": 8.03,
168
  "learning_rate": 9.259259259259259e-06,
169
+ "loss": 0.0021,
170
  "step": 1500
171
  },
172
  {
173
  "epoch": 8.09,
174
  "learning_rate": 6.172839506172839e-06,
175
+ "loss": 0.0019,
176
  "step": 1600
177
  },
178
  {
179
  "epoch": 8.1,
180
+ "eval_accuracy": 0.9763313609467456,
181
+ "eval_loss": 0.08644197881221771,
182
+ "eval_runtime": 78.2696,
183
+ "eval_samples_per_second": 4.318,
184
+ "eval_steps_per_second": 2.159,
185
  "step": 1620
186
  },
187
  {
188
  "epoch": 9.04,
189
  "learning_rate": 3.0864197530864196e-06,
190
+ "loss": 0.0038,
191
  "step": 1700
192
  },
193
  {
194
  "epoch": 9.1,
195
  "learning_rate": 0.0,
196
+ "loss": 0.0054,
197
  "step": 1800
198
  },
199
  {
200
  "epoch": 9.1,
201
+ "eval_accuracy": 0.9763313609467456,
202
+ "eval_loss": 0.08389929682016373,
203
+ "eval_runtime": 77.5761,
204
+ "eval_samples_per_second": 4.357,
205
  "eval_steps_per_second": 2.179,
206
  "step": 1800
207
  },
 
209
  "epoch": 9.1,
210
  "step": 1800,
211
  "total_flos": 4.4862325749448704e+18,
212
+ "train_loss": 0.42906751138468585,
213
+ "train_runtime": 2457.281,
214
+ "train_samples_per_second": 1.465,
215
+ "train_steps_per_second": 0.733
216
  },
217
  {
218
  "epoch": 9.1,
219
+ "eval_accuracy": 0.0,
220
+ "eval_loss": 8.188952445983887,
221
+ "eval_runtime": 2.195,
222
+ "eval_samples_per_second": 3.645,
223
+ "eval_steps_per_second": 1.822,
224
  "step": 1800
225
  },
226
  {
227
  "epoch": 9.1,
228
+ "eval_accuracy": 0.0,
229
+ "eval_loss": 8.188952445983887,
230
+ "eval_runtime": 1.8553,
231
+ "eval_samples_per_second": 4.312,
232
+ "eval_steps_per_second": 2.156,
233
  "step": 1800
234
  }
235
  ],