delivery_truck_classification / trainer_state.json
JEdward7777's picture
End of training
975cb8b
raw
history blame
16.8 kB
{
"best_metric": 0.9733333333333334,
"best_model_checkpoint": "delivery_truck_classification/checkpoint-155",
"epoch": 59.90909090909091,
"global_step": 300,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.91,
"eval_accuracy": 0.06666666666666667,
"eval_loss": 2.124830722808838,
"eval_runtime": 4.5982,
"eval_samples_per_second": 16.311,
"eval_steps_per_second": 0.652,
"step": 5
},
{
"epoch": 1.91,
"eval_accuracy": 0.24,
"eval_loss": 1.922129511833191,
"eval_runtime": 4.7321,
"eval_samples_per_second": 15.849,
"eval_steps_per_second": 0.634,
"step": 10
},
{
"epoch": 2.91,
"eval_accuracy": 0.32,
"eval_loss": 1.7176545858383179,
"eval_runtime": 4.4837,
"eval_samples_per_second": 16.727,
"eval_steps_per_second": 0.669,
"step": 15
},
{
"epoch": 3.91,
"learning_rate": 3.3333333333333335e-05,
"loss": 2.0123,
"step": 20
},
{
"epoch": 3.91,
"eval_accuracy": 0.4266666666666667,
"eval_loss": 1.5490375757217407,
"eval_runtime": 4.4804,
"eval_samples_per_second": 16.74,
"eval_steps_per_second": 0.67,
"step": 20
},
{
"epoch": 4.91,
"eval_accuracy": 0.5333333333333333,
"eval_loss": 1.3192248344421387,
"eval_runtime": 4.5163,
"eval_samples_per_second": 16.607,
"eval_steps_per_second": 0.664,
"step": 25
},
{
"epoch": 5.91,
"eval_accuracy": 0.64,
"eval_loss": 1.0764085054397583,
"eval_runtime": 4.4752,
"eval_samples_per_second": 16.759,
"eval_steps_per_second": 0.67,
"step": 30
},
{
"epoch": 6.91,
"eval_accuracy": 0.76,
"eval_loss": 0.8421124219894409,
"eval_runtime": 4.5472,
"eval_samples_per_second": 16.494,
"eval_steps_per_second": 0.66,
"step": 35
},
{
"epoch": 7.91,
"learning_rate": 4.814814814814815e-05,
"loss": 1.3539,
"step": 40
},
{
"epoch": 7.91,
"eval_accuracy": 0.8266666666666667,
"eval_loss": 0.6503960490226746,
"eval_runtime": 4.6022,
"eval_samples_per_second": 16.296,
"eval_steps_per_second": 0.652,
"step": 40
},
{
"epoch": 8.91,
"eval_accuracy": 0.8666666666666667,
"eval_loss": 0.5242553949356079,
"eval_runtime": 4.4829,
"eval_samples_per_second": 16.73,
"eval_steps_per_second": 0.669,
"step": 45
},
{
"epoch": 9.91,
"eval_accuracy": 0.88,
"eval_loss": 0.4281647205352783,
"eval_runtime": 4.4238,
"eval_samples_per_second": 16.954,
"eval_steps_per_second": 0.678,
"step": 50
},
{
"epoch": 10.91,
"eval_accuracy": 0.9066666666666666,
"eval_loss": 0.3949722349643707,
"eval_runtime": 4.5638,
"eval_samples_per_second": 16.434,
"eval_steps_per_second": 0.657,
"step": 55
},
{
"epoch": 11.91,
"learning_rate": 4.4444444444444447e-05,
"loss": 0.7315,
"step": 60
},
{
"epoch": 11.91,
"eval_accuracy": 0.8933333333333333,
"eval_loss": 0.361709862947464,
"eval_runtime": 4.5199,
"eval_samples_per_second": 16.593,
"eval_steps_per_second": 0.664,
"step": 60
},
{
"epoch": 12.91,
"eval_accuracy": 0.9066666666666666,
"eval_loss": 0.3166624903678894,
"eval_runtime": 4.4623,
"eval_samples_per_second": 16.807,
"eval_steps_per_second": 0.672,
"step": 65
},
{
"epoch": 13.91,
"eval_accuracy": 0.9066666666666666,
"eval_loss": 0.3022773861885071,
"eval_runtime": 4.4075,
"eval_samples_per_second": 17.016,
"eval_steps_per_second": 0.681,
"step": 70
},
{
"epoch": 14.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.24396675825119019,
"eval_runtime": 4.4157,
"eval_samples_per_second": 16.985,
"eval_steps_per_second": 0.679,
"step": 75
},
{
"epoch": 15.91,
"learning_rate": 4.074074074074074e-05,
"loss": 0.5713,
"step": 80
},
{
"epoch": 15.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.24749578535556793,
"eval_runtime": 4.3849,
"eval_samples_per_second": 17.104,
"eval_steps_per_second": 0.684,
"step": 80
},
{
"epoch": 16.91,
"eval_accuracy": 0.92,
"eval_loss": 0.2443261742591858,
"eval_runtime": 4.5173,
"eval_samples_per_second": 16.603,
"eval_steps_per_second": 0.664,
"step": 85
},
{
"epoch": 17.91,
"eval_accuracy": 0.96,
"eval_loss": 0.20929811894893646,
"eval_runtime": 4.4498,
"eval_samples_per_second": 16.855,
"eval_steps_per_second": 0.674,
"step": 90
},
{
"epoch": 18.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.20770420134067535,
"eval_runtime": 4.481,
"eval_samples_per_second": 16.737,
"eval_steps_per_second": 0.669,
"step": 95
},
{
"epoch": 19.91,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.515,
"step": 100
},
{
"epoch": 19.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.2124166041612625,
"eval_runtime": 4.6887,
"eval_samples_per_second": 15.996,
"eval_steps_per_second": 0.64,
"step": 100
},
{
"epoch": 20.91,
"eval_accuracy": 0.96,
"eval_loss": 0.21663539111614227,
"eval_runtime": 4.4061,
"eval_samples_per_second": 17.022,
"eval_steps_per_second": 0.681,
"step": 105
},
{
"epoch": 21.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.1939961463212967,
"eval_runtime": 4.4646,
"eval_samples_per_second": 16.799,
"eval_steps_per_second": 0.672,
"step": 110
},
{
"epoch": 22.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.19843259453773499,
"eval_runtime": 4.5883,
"eval_samples_per_second": 16.346,
"eval_steps_per_second": 0.654,
"step": 115
},
{
"epoch": 23.91,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.4582,
"step": 120
},
{
"epoch": 23.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.23953679203987122,
"eval_runtime": 4.5302,
"eval_samples_per_second": 16.556,
"eval_steps_per_second": 0.662,
"step": 120
},
{
"epoch": 24.91,
"eval_accuracy": 0.92,
"eval_loss": 0.24795593321323395,
"eval_runtime": 4.4621,
"eval_samples_per_second": 16.808,
"eval_steps_per_second": 0.672,
"step": 125
},
{
"epoch": 25.91,
"eval_accuracy": 0.92,
"eval_loss": 0.2179584801197052,
"eval_runtime": 4.4204,
"eval_samples_per_second": 16.967,
"eval_steps_per_second": 0.679,
"step": 130
},
{
"epoch": 26.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.2231944501399994,
"eval_runtime": 4.4482,
"eval_samples_per_second": 16.861,
"eval_steps_per_second": 0.674,
"step": 135
},
{
"epoch": 27.91,
"learning_rate": 2.962962962962963e-05,
"loss": 0.4279,
"step": 140
},
{
"epoch": 27.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.1976775974035263,
"eval_runtime": 4.4409,
"eval_samples_per_second": 16.888,
"eval_steps_per_second": 0.676,
"step": 140
},
{
"epoch": 28.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.18473981320858002,
"eval_runtime": 4.4471,
"eval_samples_per_second": 16.865,
"eval_steps_per_second": 0.675,
"step": 145
},
{
"epoch": 29.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.19218212366104126,
"eval_runtime": 4.4988,
"eval_samples_per_second": 16.671,
"eval_steps_per_second": 0.667,
"step": 150
},
{
"epoch": 30.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.1787085384130478,
"eval_runtime": 4.4136,
"eval_samples_per_second": 16.993,
"eval_steps_per_second": 0.68,
"step": 155
},
{
"epoch": 31.91,
"learning_rate": 2.5925925925925925e-05,
"loss": 0.4031,
"step": 160
},
{
"epoch": 31.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.16259188950061798,
"eval_runtime": 4.4524,
"eval_samples_per_second": 16.845,
"eval_steps_per_second": 0.674,
"step": 160
},
{
"epoch": 32.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.16668973863124847,
"eval_runtime": 4.4694,
"eval_samples_per_second": 16.781,
"eval_steps_per_second": 0.671,
"step": 165
},
{
"epoch": 33.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.1871425062417984,
"eval_runtime": 4.4399,
"eval_samples_per_second": 16.892,
"eval_steps_per_second": 0.676,
"step": 170
},
{
"epoch": 34.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.20150674879550934,
"eval_runtime": 4.4431,
"eval_samples_per_second": 16.88,
"eval_steps_per_second": 0.675,
"step": 175
},
{
"epoch": 35.91,
"learning_rate": 2.2222222222222223e-05,
"loss": 0.3952,
"step": 180
},
{
"epoch": 35.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.18359220027923584,
"eval_runtime": 4.5102,
"eval_samples_per_second": 16.629,
"eval_steps_per_second": 0.665,
"step": 180
},
{
"epoch": 36.91,
"eval_accuracy": 0.96,
"eval_loss": 0.18555229902267456,
"eval_runtime": 4.5169,
"eval_samples_per_second": 16.604,
"eval_steps_per_second": 0.664,
"step": 185
},
{
"epoch": 37.91,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 0.1952236294746399,
"eval_runtime": 4.5438,
"eval_samples_per_second": 16.506,
"eval_steps_per_second": 0.66,
"step": 190
},
{
"epoch": 38.91,
"eval_accuracy": 0.96,
"eval_loss": 0.1720731258392334,
"eval_runtime": 4.4501,
"eval_samples_per_second": 16.854,
"eval_steps_per_second": 0.674,
"step": 195
},
{
"epoch": 39.91,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.369,
"step": 200
},
{
"epoch": 39.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.1618812382221222,
"eval_runtime": 4.4486,
"eval_samples_per_second": 16.859,
"eval_steps_per_second": 0.674,
"step": 200
},
{
"epoch": 40.91,
"eval_accuracy": 0.96,
"eval_loss": 0.16587452590465546,
"eval_runtime": 4.385,
"eval_samples_per_second": 17.104,
"eval_steps_per_second": 0.684,
"step": 205
},
{
"epoch": 41.91,
"eval_accuracy": 0.96,
"eval_loss": 0.1568831503391266,
"eval_runtime": 4.5404,
"eval_samples_per_second": 16.518,
"eval_steps_per_second": 0.661,
"step": 210
},
{
"epoch": 42.91,
"eval_accuracy": 0.96,
"eval_loss": 0.1357746571302414,
"eval_runtime": 4.4209,
"eval_samples_per_second": 16.965,
"eval_steps_per_second": 0.679,
"step": 215
},
{
"epoch": 43.91,
"learning_rate": 1.4814814814814815e-05,
"loss": 0.3262,
"step": 220
},
{
"epoch": 43.91,
"eval_accuracy": 0.96,
"eval_loss": 0.13711059093475342,
"eval_runtime": 4.5003,
"eval_samples_per_second": 16.665,
"eval_steps_per_second": 0.667,
"step": 220
},
{
"epoch": 44.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.1336827427148819,
"eval_runtime": 4.47,
"eval_samples_per_second": 16.779,
"eval_steps_per_second": 0.671,
"step": 225
},
{
"epoch": 45.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.13736897706985474,
"eval_runtime": 4.5693,
"eval_samples_per_second": 16.414,
"eval_steps_per_second": 0.657,
"step": 230
},
{
"epoch": 46.91,
"eval_accuracy": 0.96,
"eval_loss": 0.17894567549228668,
"eval_runtime": 4.3355,
"eval_samples_per_second": 17.299,
"eval_steps_per_second": 0.692,
"step": 235
},
{
"epoch": 47.91,
"learning_rate": 1.1111111111111112e-05,
"loss": 0.3616,
"step": 240
},
{
"epoch": 47.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.21668750047683716,
"eval_runtime": 4.4669,
"eval_samples_per_second": 16.79,
"eval_steps_per_second": 0.672,
"step": 240
},
{
"epoch": 48.91,
"eval_accuracy": 0.96,
"eval_loss": 0.17571820318698883,
"eval_runtime": 4.4771,
"eval_samples_per_second": 16.752,
"eval_steps_per_second": 0.67,
"step": 245
},
{
"epoch": 49.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.17293348908424377,
"eval_runtime": 4.4293,
"eval_samples_per_second": 16.933,
"eval_steps_per_second": 0.677,
"step": 250
},
{
"epoch": 50.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.17224831879138947,
"eval_runtime": 4.4183,
"eval_samples_per_second": 16.975,
"eval_steps_per_second": 0.679,
"step": 255
},
{
"epoch": 51.91,
"learning_rate": 7.4074074074074075e-06,
"loss": 0.303,
"step": 260
},
{
"epoch": 51.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.16005316376686096,
"eval_runtime": 4.4073,
"eval_samples_per_second": 17.017,
"eval_steps_per_second": 0.681,
"step": 260
},
{
"epoch": 52.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.15919166803359985,
"eval_runtime": 4.4398,
"eval_samples_per_second": 16.893,
"eval_steps_per_second": 0.676,
"step": 265
},
{
"epoch": 53.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.16125422716140747,
"eval_runtime": 4.3899,
"eval_samples_per_second": 17.085,
"eval_steps_per_second": 0.683,
"step": 270
},
{
"epoch": 54.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.15753033757209778,
"eval_runtime": 4.4684,
"eval_samples_per_second": 16.785,
"eval_steps_per_second": 0.671,
"step": 275
},
{
"epoch": 55.91,
"learning_rate": 3.7037037037037037e-06,
"loss": 0.305,
"step": 280
},
{
"epoch": 55.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.15587559342384338,
"eval_runtime": 4.3795,
"eval_samples_per_second": 17.125,
"eval_steps_per_second": 0.685,
"step": 280
},
{
"epoch": 56.91,
"eval_accuracy": 0.9733333333333334,
"eval_loss": 0.14887748658657074,
"eval_runtime": 4.4449,
"eval_samples_per_second": 16.873,
"eval_steps_per_second": 0.675,
"step": 285
},
{
"epoch": 57.91,
"eval_accuracy": 0.96,
"eval_loss": 0.14639350771903992,
"eval_runtime": 4.4527,
"eval_samples_per_second": 16.844,
"eval_steps_per_second": 0.674,
"step": 290
},
{
"epoch": 58.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.14625021815299988,
"eval_runtime": 4.4199,
"eval_samples_per_second": 16.969,
"eval_steps_per_second": 0.679,
"step": 295
},
{
"epoch": 59.91,
"learning_rate": 0.0,
"loss": 0.3328,
"step": 300
},
{
"epoch": 59.91,
"eval_accuracy": 0.9466666666666667,
"eval_loss": 0.14626549184322357,
"eval_runtime": 4.4407,
"eval_samples_per_second": 16.889,
"eval_steps_per_second": 0.676,
"step": 300
},
{
"epoch": 59.91,
"step": 300,
"total_flos": 1.0044714081093673e+18,
"train_loss": 0.5910613632202149,
"train_runtime": 5579.9163,
"train_samples_per_second": 7.247,
"train_steps_per_second": 0.054
}
],
"max_steps": 300,
"num_train_epochs": 60,
"total_flos": 1.0044714081093673e+18,
"trial_name": null,
"trial_params": null
}