anirudhmu's picture
End of training
deb26e9
{
"best_metric": 0.9844559585492227,
"best_model_checkpoint": "videomae-base-finetuned-soccer-action-recognitionx4/checkpoint-960",
"epoch": 39.02066666666666,
"eval_steps": 500,
"global_step": 1125,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.02,
"eval_accuracy": 0.37823834196891193,
"eval_loss": 1.3255189657211304,
"eval_runtime": 88.7594,
"eval_samples_per_second": 2.174,
"eval_steps_per_second": 0.552,
"step": 28
},
{
"epoch": 1.02,
"eval_accuracy": 0.5751295336787565,
"eval_loss": 0.9903116822242737,
"eval_runtime": 34.7202,
"eval_samples_per_second": 5.559,
"eval_steps_per_second": 1.411,
"step": 56
},
{
"epoch": 2.02,
"learning_rate": 1.4159292035398232e-05,
"loss": 1.1078,
"step": 80
},
{
"epoch": 2.02,
"eval_accuracy": 0.8238341968911918,
"eval_loss": 0.46475353837013245,
"eval_runtime": 33.6288,
"eval_samples_per_second": 5.739,
"eval_steps_per_second": 1.457,
"step": 84
},
{
"epoch": 3.03,
"eval_accuracy": 0.8341968911917098,
"eval_loss": 0.4074859917163849,
"eval_runtime": 33.5102,
"eval_samples_per_second": 5.759,
"eval_steps_per_second": 1.462,
"step": 113
},
{
"epoch": 4.02,
"eval_accuracy": 0.927461139896373,
"eval_loss": 0.23006045818328857,
"eval_runtime": 34.0136,
"eval_samples_per_second": 5.674,
"eval_steps_per_second": 1.441,
"step": 141
},
{
"epoch": 5.02,
"learning_rate": 1.907114624505929e-05,
"loss": 0.2591,
"step": 160
},
{
"epoch": 5.02,
"eval_accuracy": 0.8549222797927462,
"eval_loss": 0.4089970588684082,
"eval_runtime": 33.9545,
"eval_samples_per_second": 5.684,
"eval_steps_per_second": 1.443,
"step": 169
},
{
"epoch": 6.02,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.1527147889137268,
"eval_runtime": 34.2304,
"eval_samples_per_second": 5.638,
"eval_steps_per_second": 1.431,
"step": 197
},
{
"epoch": 7.03,
"eval_accuracy": 0.9585492227979274,
"eval_loss": 0.14126576483249664,
"eval_runtime": 34.1805,
"eval_samples_per_second": 5.646,
"eval_steps_per_second": 1.434,
"step": 226
},
{
"epoch": 8.01,
"learning_rate": 1.74901185770751e-05,
"loss": 0.111,
"step": 240
},
{
"epoch": 8.02,
"eval_accuracy": 0.9637305699481865,
"eval_loss": 0.1385740041732788,
"eval_runtime": 33.69,
"eval_samples_per_second": 5.729,
"eval_steps_per_second": 1.454,
"step": 254
},
{
"epoch": 9.02,
"eval_accuracy": 0.9430051813471503,
"eval_loss": 0.16739489138126373,
"eval_runtime": 34.3119,
"eval_samples_per_second": 5.625,
"eval_steps_per_second": 1.428,
"step": 282
},
{
"epoch": 10.02,
"eval_accuracy": 0.9740932642487047,
"eval_loss": 0.10096671432256699,
"eval_runtime": 33.6401,
"eval_samples_per_second": 5.737,
"eval_steps_per_second": 1.457,
"step": 310
},
{
"epoch": 11.01,
"learning_rate": 1.590909090909091e-05,
"loss": 0.0509,
"step": 320
},
{
"epoch": 11.03,
"eval_accuracy": 0.9637305699481865,
"eval_loss": 0.1586216688156128,
"eval_runtime": 33.6589,
"eval_samples_per_second": 5.734,
"eval_steps_per_second": 1.456,
"step": 339
},
{
"epoch": 12.02,
"eval_accuracy": 0.8860103626943006,
"eval_loss": 0.2695624530315399,
"eval_runtime": 34.0413,
"eval_samples_per_second": 5.67,
"eval_steps_per_second": 1.439,
"step": 367
},
{
"epoch": 13.02,
"eval_accuracy": 0.917098445595855,
"eval_loss": 0.3004997670650482,
"eval_runtime": 33.8891,
"eval_samples_per_second": 5.695,
"eval_steps_per_second": 1.446,
"step": 395
},
{
"epoch": 14.0,
"learning_rate": 1.432806324110672e-05,
"loss": 0.023,
"step": 400
},
{
"epoch": 14.02,
"eval_accuracy": 0.9740932642487047,
"eval_loss": 0.10009404271841049,
"eval_runtime": 34.3813,
"eval_samples_per_second": 5.614,
"eval_steps_per_second": 1.425,
"step": 423
},
{
"epoch": 15.03,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.19607579708099365,
"eval_runtime": 33.8549,
"eval_samples_per_second": 5.701,
"eval_steps_per_second": 1.447,
"step": 452
},
{
"epoch": 16.02,
"learning_rate": 1.274703557312253e-05,
"loss": 0.0354,
"step": 480
},
{
"epoch": 16.02,
"eval_accuracy": 0.9222797927461139,
"eval_loss": 0.2595587968826294,
"eval_runtime": 34.7628,
"eval_samples_per_second": 5.552,
"eval_steps_per_second": 1.41,
"step": 480
},
{
"epoch": 17.02,
"eval_accuracy": 0.9689119170984456,
"eval_loss": 0.10061533749103546,
"eval_runtime": 36.7389,
"eval_samples_per_second": 5.253,
"eval_steps_per_second": 1.334,
"step": 508
},
{
"epoch": 18.02,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.09470318257808685,
"eval_runtime": 35.1648,
"eval_samples_per_second": 5.488,
"eval_steps_per_second": 1.393,
"step": 536
},
{
"epoch": 19.02,
"learning_rate": 1.116600790513834e-05,
"loss": 0.0141,
"step": 560
},
{
"epoch": 19.03,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.08311115205287933,
"eval_runtime": 35.0699,
"eval_samples_per_second": 5.503,
"eval_steps_per_second": 1.397,
"step": 565
},
{
"epoch": 20.02,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.06850504875183105,
"eval_runtime": 34.7445,
"eval_samples_per_second": 5.555,
"eval_steps_per_second": 1.41,
"step": 593
},
{
"epoch": 21.02,
"eval_accuracy": 0.9689119170984456,
"eval_loss": 0.09778512269258499,
"eval_runtime": 34.2526,
"eval_samples_per_second": 5.635,
"eval_steps_per_second": 1.431,
"step": 621
},
{
"epoch": 22.02,
"learning_rate": 9.58498023715415e-06,
"loss": 0.0168,
"step": 640
},
{
"epoch": 22.02,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.08115241676568985,
"eval_runtime": 33.4433,
"eval_samples_per_second": 5.771,
"eval_steps_per_second": 1.465,
"step": 649
},
{
"epoch": 23.03,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.07816170156002045,
"eval_runtime": 32.8844,
"eval_samples_per_second": 5.869,
"eval_steps_per_second": 1.49,
"step": 678
},
{
"epoch": 24.02,
"eval_accuracy": 0.927461139896373,
"eval_loss": 0.2624199390411377,
"eval_runtime": 33.6116,
"eval_samples_per_second": 5.742,
"eval_steps_per_second": 1.458,
"step": 706
},
{
"epoch": 25.01,
"learning_rate": 8.003952569169962e-06,
"loss": 0.0029,
"step": 720
},
{
"epoch": 25.02,
"eval_accuracy": 0.9533678756476683,
"eval_loss": 0.1805860698223114,
"eval_runtime": 33.2451,
"eval_samples_per_second": 5.805,
"eval_steps_per_second": 1.474,
"step": 734
},
{
"epoch": 26.02,
"eval_accuracy": 0.9585492227979274,
"eval_loss": 0.21230334043502808,
"eval_runtime": 32.7523,
"eval_samples_per_second": 5.893,
"eval_steps_per_second": 1.496,
"step": 762
},
{
"epoch": 27.03,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.200972780585289,
"eval_runtime": 34.3388,
"eval_samples_per_second": 5.62,
"eval_steps_per_second": 1.427,
"step": 791
},
{
"epoch": 28.01,
"learning_rate": 6.422924901185771e-06,
"loss": 0.0048,
"step": 800
},
{
"epoch": 28.02,
"eval_accuracy": 0.9689119170984456,
"eval_loss": 0.12585969269275665,
"eval_runtime": 32.5431,
"eval_samples_per_second": 5.931,
"eval_steps_per_second": 1.506,
"step": 819
},
{
"epoch": 29.02,
"eval_accuracy": 0.9430051813471503,
"eval_loss": 0.2145320475101471,
"eval_runtime": 33.8812,
"eval_samples_per_second": 5.696,
"eval_steps_per_second": 1.446,
"step": 847
},
{
"epoch": 30.02,
"eval_accuracy": 0.9222797927461139,
"eval_loss": 0.29007139801979065,
"eval_runtime": 33.0865,
"eval_samples_per_second": 5.833,
"eval_steps_per_second": 1.481,
"step": 875
},
{
"epoch": 31.0,
"learning_rate": 4.841897233201581e-06,
"loss": 0.0042,
"step": 880
},
{
"epoch": 31.03,
"eval_accuracy": 0.9792746113989638,
"eval_loss": 0.0911334827542305,
"eval_runtime": 32.213,
"eval_samples_per_second": 5.991,
"eval_steps_per_second": 1.521,
"step": 904
},
{
"epoch": 32.02,
"eval_accuracy": 0.9740932642487047,
"eval_loss": 0.0891527533531189,
"eval_runtime": 35.2316,
"eval_samples_per_second": 5.478,
"eval_steps_per_second": 1.391,
"step": 932
},
{
"epoch": 33.02,
"learning_rate": 3.2608695652173914e-06,
"loss": 0.0024,
"step": 960
},
{
"epoch": 33.02,
"eval_accuracy": 0.9844559585492227,
"eval_loss": 0.09106723964214325,
"eval_runtime": 33.6234,
"eval_samples_per_second": 5.74,
"eval_steps_per_second": 1.457,
"step": 960
},
{
"epoch": 34.02,
"eval_accuracy": 0.9740932642487047,
"eval_loss": 0.09867668896913528,
"eval_runtime": 34.9535,
"eval_samples_per_second": 5.522,
"eval_steps_per_second": 1.402,
"step": 988
},
{
"epoch": 35.03,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.14462456107139587,
"eval_runtime": 34.1647,
"eval_samples_per_second": 5.649,
"eval_steps_per_second": 1.434,
"step": 1017
},
{
"epoch": 36.02,
"learning_rate": 1.6798418972332018e-06,
"loss": 0.0008,
"step": 1040
},
{
"epoch": 36.02,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.14153124392032623,
"eval_runtime": 33.7336,
"eval_samples_per_second": 5.721,
"eval_steps_per_second": 1.453,
"step": 1045
},
{
"epoch": 37.02,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.1434861421585083,
"eval_runtime": 34.3867,
"eval_samples_per_second": 5.613,
"eval_steps_per_second": 1.425,
"step": 1073
},
{
"epoch": 38.02,
"eval_accuracy": 0.9481865284974094,
"eval_loss": 0.14380092918872833,
"eval_runtime": 34.1415,
"eval_samples_per_second": 5.653,
"eval_steps_per_second": 1.435,
"step": 1101
},
{
"epoch": 39.02,
"learning_rate": 9.881422924901187e-08,
"loss": 0.0008,
"step": 1120
},
{
"epoch": 39.02,
"eval_accuracy": 0.9533678756476683,
"eval_loss": 0.137101411819458,
"eval_runtime": 34.8796,
"eval_samples_per_second": 5.533,
"eval_steps_per_second": 1.405,
"step": 1125
},
{
"epoch": 39.02,
"step": 1125,
"total_flos": 4.471333316936427e+19,
"train_loss": 0.1162004730856667,
"train_runtime": 11133.0856,
"train_samples_per_second": 3.234,
"train_steps_per_second": 0.101
},
{
"epoch": 39.02,
"eval_accuracy": 0.964824120603015,
"eval_loss": 0.13270962238311768,
"eval_runtime": 98.7852,
"eval_samples_per_second": 2.014,
"eval_steps_per_second": 0.506,
"step": 1125
},
{
"epoch": 39.02,
"eval_accuracy": 0.964824120603015,
"eval_loss": 0.13270962238311768,
"eval_runtime": 34.085,
"eval_samples_per_second": 5.838,
"eval_steps_per_second": 1.467,
"step": 1125
}
],
"logging_steps": 80,
"max_steps": 1125,
"num_train_epochs": 9223372036854775807,
"save_steps": 500,
"total_flos": 4.471333316936427e+19,
"trial_name": null,
"trial_params": null
}