{ "best_metric": 0.9733333333333334, "best_model_checkpoint": "delivery_truck_classification/checkpoint-155", "epoch": 59.90909090909091, "global_step": 300, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.91, "eval_accuracy": 0.06666666666666667, "eval_loss": 2.124830722808838, "eval_runtime": 4.5982, "eval_samples_per_second": 16.311, "eval_steps_per_second": 0.652, "step": 5 }, { "epoch": 1.91, "eval_accuracy": 0.24, "eval_loss": 1.922129511833191, "eval_runtime": 4.7321, "eval_samples_per_second": 15.849, "eval_steps_per_second": 0.634, "step": 10 }, { "epoch": 2.91, "eval_accuracy": 0.32, "eval_loss": 1.7176545858383179, "eval_runtime": 4.4837, "eval_samples_per_second": 16.727, "eval_steps_per_second": 0.669, "step": 15 }, { "epoch": 3.91, "learning_rate": 3.3333333333333335e-05, "loss": 2.0123, "step": 20 }, { "epoch": 3.91, "eval_accuracy": 0.4266666666666667, "eval_loss": 1.5490375757217407, "eval_runtime": 4.4804, "eval_samples_per_second": 16.74, "eval_steps_per_second": 0.67, "step": 20 }, { "epoch": 4.91, "eval_accuracy": 0.5333333333333333, "eval_loss": 1.3192248344421387, "eval_runtime": 4.5163, "eval_samples_per_second": 16.607, "eval_steps_per_second": 0.664, "step": 25 }, { "epoch": 5.91, "eval_accuracy": 0.64, "eval_loss": 1.0764085054397583, "eval_runtime": 4.4752, "eval_samples_per_second": 16.759, "eval_steps_per_second": 0.67, "step": 30 }, { "epoch": 6.91, "eval_accuracy": 0.76, "eval_loss": 0.8421124219894409, "eval_runtime": 4.5472, "eval_samples_per_second": 16.494, "eval_steps_per_second": 0.66, "step": 35 }, { "epoch": 7.91, "learning_rate": 4.814814814814815e-05, "loss": 1.3539, "step": 40 }, { "epoch": 7.91, "eval_accuracy": 0.8266666666666667, "eval_loss": 0.6503960490226746, "eval_runtime": 4.6022, "eval_samples_per_second": 16.296, "eval_steps_per_second": 0.652, "step": 40 }, { "epoch": 8.91, "eval_accuracy": 0.8666666666666667, "eval_loss": 0.5242553949356079, "eval_runtime": 4.4829, "eval_samples_per_second": 16.73, "eval_steps_per_second": 0.669, "step": 45 }, { "epoch": 9.91, "eval_accuracy": 0.88, "eval_loss": 0.4281647205352783, "eval_runtime": 4.4238, "eval_samples_per_second": 16.954, "eval_steps_per_second": 0.678, "step": 50 }, { "epoch": 10.91, "eval_accuracy": 0.9066666666666666, "eval_loss": 0.3949722349643707, "eval_runtime": 4.5638, "eval_samples_per_second": 16.434, "eval_steps_per_second": 0.657, "step": 55 }, { "epoch": 11.91, "learning_rate": 4.4444444444444447e-05, "loss": 0.7315, "step": 60 }, { "epoch": 11.91, "eval_accuracy": 0.8933333333333333, "eval_loss": 0.361709862947464, "eval_runtime": 4.5199, "eval_samples_per_second": 16.593, "eval_steps_per_second": 0.664, "step": 60 }, { "epoch": 12.91, "eval_accuracy": 0.9066666666666666, "eval_loss": 0.3166624903678894, "eval_runtime": 4.4623, "eval_samples_per_second": 16.807, "eval_steps_per_second": 0.672, "step": 65 }, { "epoch": 13.91, "eval_accuracy": 0.9066666666666666, "eval_loss": 0.3022773861885071, "eval_runtime": 4.4075, "eval_samples_per_second": 17.016, "eval_steps_per_second": 0.681, "step": 70 }, { "epoch": 14.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.24396675825119019, "eval_runtime": 4.4157, "eval_samples_per_second": 16.985, "eval_steps_per_second": 0.679, "step": 75 }, { "epoch": 15.91, "learning_rate": 4.074074074074074e-05, "loss": 0.5713, "step": 80 }, { "epoch": 15.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.24749578535556793, "eval_runtime": 4.3849, "eval_samples_per_second": 17.104, "eval_steps_per_second": 0.684, "step": 80 }, { "epoch": 16.91, "eval_accuracy": 0.92, "eval_loss": 0.2443261742591858, "eval_runtime": 4.5173, "eval_samples_per_second": 16.603, "eval_steps_per_second": 0.664, "step": 85 }, { "epoch": 17.91, "eval_accuracy": 0.96, "eval_loss": 0.20929811894893646, "eval_runtime": 4.4498, "eval_samples_per_second": 16.855, "eval_steps_per_second": 0.674, "step": 90 }, { "epoch": 18.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.20770420134067535, "eval_runtime": 4.481, "eval_samples_per_second": 16.737, "eval_steps_per_second": 0.669, "step": 95 }, { "epoch": 19.91, "learning_rate": 3.7037037037037037e-05, "loss": 0.515, "step": 100 }, { "epoch": 19.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.2124166041612625, "eval_runtime": 4.6887, "eval_samples_per_second": 15.996, "eval_steps_per_second": 0.64, "step": 100 }, { "epoch": 20.91, "eval_accuracy": 0.96, "eval_loss": 0.21663539111614227, "eval_runtime": 4.4061, "eval_samples_per_second": 17.022, "eval_steps_per_second": 0.681, "step": 105 }, { "epoch": 21.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.1939961463212967, "eval_runtime": 4.4646, "eval_samples_per_second": 16.799, "eval_steps_per_second": 0.672, "step": 110 }, { "epoch": 22.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.19843259453773499, "eval_runtime": 4.5883, "eval_samples_per_second": 16.346, "eval_steps_per_second": 0.654, "step": 115 }, { "epoch": 23.91, "learning_rate": 3.3333333333333335e-05, "loss": 0.4582, "step": 120 }, { "epoch": 23.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.23953679203987122, "eval_runtime": 4.5302, "eval_samples_per_second": 16.556, "eval_steps_per_second": 0.662, "step": 120 }, { "epoch": 24.91, "eval_accuracy": 0.92, "eval_loss": 0.24795593321323395, "eval_runtime": 4.4621, "eval_samples_per_second": 16.808, "eval_steps_per_second": 0.672, "step": 125 }, { "epoch": 25.91, "eval_accuracy": 0.92, "eval_loss": 0.2179584801197052, "eval_runtime": 4.4204, "eval_samples_per_second": 16.967, "eval_steps_per_second": 0.679, "step": 130 }, { "epoch": 26.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.2231944501399994, "eval_runtime": 4.4482, "eval_samples_per_second": 16.861, "eval_steps_per_second": 0.674, "step": 135 }, { "epoch": 27.91, "learning_rate": 2.962962962962963e-05, "loss": 0.4279, "step": 140 }, { "epoch": 27.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.1976775974035263, "eval_runtime": 4.4409, "eval_samples_per_second": 16.888, "eval_steps_per_second": 0.676, "step": 140 }, { "epoch": 28.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.18473981320858002, "eval_runtime": 4.4471, "eval_samples_per_second": 16.865, "eval_steps_per_second": 0.675, "step": 145 }, { "epoch": 29.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.19218212366104126, "eval_runtime": 4.4988, "eval_samples_per_second": 16.671, "eval_steps_per_second": 0.667, "step": 150 }, { "epoch": 30.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.1787085384130478, "eval_runtime": 4.4136, "eval_samples_per_second": 16.993, "eval_steps_per_second": 0.68, "step": 155 }, { "epoch": 31.91, "learning_rate": 2.5925925925925925e-05, "loss": 0.4031, "step": 160 }, { "epoch": 31.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.16259188950061798, "eval_runtime": 4.4524, "eval_samples_per_second": 16.845, "eval_steps_per_second": 0.674, "step": 160 }, { "epoch": 32.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.16668973863124847, "eval_runtime": 4.4694, "eval_samples_per_second": 16.781, "eval_steps_per_second": 0.671, "step": 165 }, { "epoch": 33.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.1871425062417984, "eval_runtime": 4.4399, "eval_samples_per_second": 16.892, "eval_steps_per_second": 0.676, "step": 170 }, { "epoch": 34.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.20150674879550934, "eval_runtime": 4.4431, "eval_samples_per_second": 16.88, "eval_steps_per_second": 0.675, "step": 175 }, { "epoch": 35.91, "learning_rate": 2.2222222222222223e-05, "loss": 0.3952, "step": 180 }, { "epoch": 35.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.18359220027923584, "eval_runtime": 4.5102, "eval_samples_per_second": 16.629, "eval_steps_per_second": 0.665, "step": 180 }, { "epoch": 36.91, "eval_accuracy": 0.96, "eval_loss": 0.18555229902267456, "eval_runtime": 4.5169, "eval_samples_per_second": 16.604, "eval_steps_per_second": 0.664, "step": 185 }, { "epoch": 37.91, "eval_accuracy": 0.9333333333333333, "eval_loss": 0.1952236294746399, "eval_runtime": 4.5438, "eval_samples_per_second": 16.506, "eval_steps_per_second": 0.66, "step": 190 }, { "epoch": 38.91, "eval_accuracy": 0.96, "eval_loss": 0.1720731258392334, "eval_runtime": 4.4501, "eval_samples_per_second": 16.854, "eval_steps_per_second": 0.674, "step": 195 }, { "epoch": 39.91, "learning_rate": 1.8518518518518518e-05, "loss": 0.369, "step": 200 }, { "epoch": 39.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.1618812382221222, "eval_runtime": 4.4486, "eval_samples_per_second": 16.859, "eval_steps_per_second": 0.674, "step": 200 }, { "epoch": 40.91, "eval_accuracy": 0.96, "eval_loss": 0.16587452590465546, "eval_runtime": 4.385, "eval_samples_per_second": 17.104, "eval_steps_per_second": 0.684, "step": 205 }, { "epoch": 41.91, "eval_accuracy": 0.96, "eval_loss": 0.1568831503391266, "eval_runtime": 4.5404, "eval_samples_per_second": 16.518, "eval_steps_per_second": 0.661, "step": 210 }, { "epoch": 42.91, "eval_accuracy": 0.96, "eval_loss": 0.1357746571302414, "eval_runtime": 4.4209, "eval_samples_per_second": 16.965, "eval_steps_per_second": 0.679, "step": 215 }, { "epoch": 43.91, "learning_rate": 1.4814814814814815e-05, "loss": 0.3262, "step": 220 }, { "epoch": 43.91, "eval_accuracy": 0.96, "eval_loss": 0.13711059093475342, "eval_runtime": 4.5003, "eval_samples_per_second": 16.665, "eval_steps_per_second": 0.667, "step": 220 }, { "epoch": 44.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.1336827427148819, "eval_runtime": 4.47, "eval_samples_per_second": 16.779, "eval_steps_per_second": 0.671, "step": 225 }, { "epoch": 45.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.13736897706985474, "eval_runtime": 4.5693, "eval_samples_per_second": 16.414, "eval_steps_per_second": 0.657, "step": 230 }, { "epoch": 46.91, "eval_accuracy": 0.96, "eval_loss": 0.17894567549228668, "eval_runtime": 4.3355, "eval_samples_per_second": 17.299, "eval_steps_per_second": 0.692, "step": 235 }, { "epoch": 47.91, "learning_rate": 1.1111111111111112e-05, "loss": 0.3616, "step": 240 }, { "epoch": 47.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.21668750047683716, "eval_runtime": 4.4669, "eval_samples_per_second": 16.79, "eval_steps_per_second": 0.672, "step": 240 }, { "epoch": 48.91, "eval_accuracy": 0.96, "eval_loss": 0.17571820318698883, "eval_runtime": 4.4771, "eval_samples_per_second": 16.752, "eval_steps_per_second": 0.67, "step": 245 }, { "epoch": 49.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.17293348908424377, "eval_runtime": 4.4293, "eval_samples_per_second": 16.933, "eval_steps_per_second": 0.677, "step": 250 }, { "epoch": 50.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.17224831879138947, "eval_runtime": 4.4183, "eval_samples_per_second": 16.975, "eval_steps_per_second": 0.679, "step": 255 }, { "epoch": 51.91, "learning_rate": 7.4074074074074075e-06, "loss": 0.303, "step": 260 }, { "epoch": 51.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.16005316376686096, "eval_runtime": 4.4073, "eval_samples_per_second": 17.017, "eval_steps_per_second": 0.681, "step": 260 }, { "epoch": 52.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.15919166803359985, "eval_runtime": 4.4398, "eval_samples_per_second": 16.893, "eval_steps_per_second": 0.676, "step": 265 }, { "epoch": 53.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.16125422716140747, "eval_runtime": 4.3899, "eval_samples_per_second": 17.085, "eval_steps_per_second": 0.683, "step": 270 }, { "epoch": 54.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.15753033757209778, "eval_runtime": 4.4684, "eval_samples_per_second": 16.785, "eval_steps_per_second": 0.671, "step": 275 }, { "epoch": 55.91, "learning_rate": 3.7037037037037037e-06, "loss": 0.305, "step": 280 }, { "epoch": 55.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.15587559342384338, "eval_runtime": 4.3795, "eval_samples_per_second": 17.125, "eval_steps_per_second": 0.685, "step": 280 }, { "epoch": 56.91, "eval_accuracy": 0.9733333333333334, "eval_loss": 0.14887748658657074, "eval_runtime": 4.4449, "eval_samples_per_second": 16.873, "eval_steps_per_second": 0.675, "step": 285 }, { "epoch": 57.91, "eval_accuracy": 0.96, "eval_loss": 0.14639350771903992, "eval_runtime": 4.4527, "eval_samples_per_second": 16.844, "eval_steps_per_second": 0.674, "step": 290 }, { "epoch": 58.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.14625021815299988, "eval_runtime": 4.4199, "eval_samples_per_second": 16.969, "eval_steps_per_second": 0.679, "step": 295 }, { "epoch": 59.91, "learning_rate": 0.0, "loss": 0.3328, "step": 300 }, { "epoch": 59.91, "eval_accuracy": 0.9466666666666667, "eval_loss": 0.14626549184322357, "eval_runtime": 4.4407, "eval_samples_per_second": 16.889, "eval_steps_per_second": 0.676, "step": 300 }, { "epoch": 59.91, "step": 300, "total_flos": 1.0044714081093673e+18, "train_loss": 0.5910613632202149, "train_runtime": 5579.9163, "train_samples_per_second": 7.247, "train_steps_per_second": 0.054 } ], "max_steps": 300, "num_train_epochs": 60, "total_flos": 1.0044714081093673e+18, "trial_name": null, "trial_params": null }