{ "best_metric": 1.0, "best_model_checkpoint": "delivery_truck_classification/checkpoint-172", "epoch": 59.94117647058823, "global_step": 240, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.94, "eval_accuracy": 0.1864406779661017, "eval_loss": 1.9123966693878174, "eval_runtime": 3.7131, "eval_samples_per_second": 15.89, "eval_steps_per_second": 0.539, "step": 4 }, { "epoch": 1.94, "eval_accuracy": 0.23728813559322035, "eval_loss": 1.8094592094421387, "eval_runtime": 4.4625, "eval_samples_per_second": 13.221, "eval_steps_per_second": 0.448, "step": 8 }, { "epoch": 2.94, "eval_accuracy": 0.3898305084745763, "eval_loss": 1.6757333278656006, "eval_runtime": 3.88, "eval_samples_per_second": 15.206, "eval_steps_per_second": 0.515, "step": 12 }, { "epoch": 3.94, "eval_accuracy": 0.5254237288135594, "eval_loss": 1.4906411170959473, "eval_runtime": 3.788, "eval_samples_per_second": 15.576, "eval_steps_per_second": 0.528, "step": 16 }, { "epoch": 4.94, "learning_rate": 4.166666666666667e-05, "loss": 1.8286, "step": 20 }, { "epoch": 4.94, "eval_accuracy": 0.6440677966101694, "eval_loss": 1.2703886032104492, "eval_runtime": 4.208, "eval_samples_per_second": 14.021, "eval_steps_per_second": 0.475, "step": 20 }, { "epoch": 5.94, "eval_accuracy": 0.6779661016949152, "eval_loss": 1.0685124397277832, "eval_runtime": 3.8096, "eval_samples_per_second": 15.487, "eval_steps_per_second": 0.525, "step": 24 }, { "epoch": 6.94, "eval_accuracy": 0.7457627118644068, "eval_loss": 0.8031855225563049, "eval_runtime": 4.1542, "eval_samples_per_second": 14.203, "eval_steps_per_second": 0.481, "step": 28 }, { "epoch": 7.94, "eval_accuracy": 0.7627118644067796, "eval_loss": 0.6308717131614685, "eval_runtime": 3.7602, "eval_samples_per_second": 15.691, "eval_steps_per_second": 0.532, "step": 32 }, { "epoch": 8.94, "eval_accuracy": 0.847457627118644, "eval_loss": 0.49890831112861633, "eval_runtime": 4.1569, "eval_samples_per_second": 14.193, "eval_steps_per_second": 0.481, "step": 36 }, { "epoch": 9.94, "learning_rate": 4.62962962962963e-05, "loss": 0.9342, "step": 40 }, { "epoch": 9.94, "eval_accuracy": 0.847457627118644, "eval_loss": 0.40634387731552124, "eval_runtime": 3.8202, "eval_samples_per_second": 15.444, "eval_steps_per_second": 0.524, "step": 40 }, { "epoch": 10.94, "eval_accuracy": 0.9152542372881356, "eval_loss": 0.26924625039100647, "eval_runtime": 4.1384, "eval_samples_per_second": 14.257, "eval_steps_per_second": 0.483, "step": 44 }, { "epoch": 11.94, "eval_accuracy": 0.8983050847457628, "eval_loss": 0.27362605929374695, "eval_runtime": 3.707, "eval_samples_per_second": 15.916, "eval_steps_per_second": 0.54, "step": 48 }, { "epoch": 12.94, "eval_accuracy": 0.9322033898305084, "eval_loss": 0.21159349381923676, "eval_runtime": 4.0712, "eval_samples_per_second": 14.492, "eval_steps_per_second": 0.491, "step": 52 }, { "epoch": 13.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.1497751921415329, "eval_runtime": 3.629, "eval_samples_per_second": 16.258, "eval_steps_per_second": 0.551, "step": 56 }, { "epoch": 14.94, "learning_rate": 4.166666666666667e-05, "loss": 0.5151, "step": 60 }, { "epoch": 14.94, "eval_accuracy": 0.9152542372881356, "eval_loss": 0.1906394362449646, "eval_runtime": 4.159, "eval_samples_per_second": 14.186, "eval_steps_per_second": 0.481, "step": 60 }, { "epoch": 15.94, "eval_accuracy": 0.9491525423728814, "eval_loss": 0.16975143551826477, "eval_runtime": 3.7313, "eval_samples_per_second": 15.812, "eval_steps_per_second": 0.536, "step": 64 }, { "epoch": 16.94, "eval_accuracy": 0.9491525423728814, "eval_loss": 0.1431875377893448, "eval_runtime": 4.1272, "eval_samples_per_second": 14.295, "eval_steps_per_second": 0.485, "step": 68 }, { "epoch": 17.94, "eval_accuracy": 0.9322033898305084, "eval_loss": 0.16815055906772614, "eval_runtime": 3.6724, "eval_samples_per_second": 16.066, "eval_steps_per_second": 0.545, "step": 72 }, { "epoch": 18.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.10692509263753891, "eval_runtime": 4.1232, "eval_samples_per_second": 14.309, "eval_steps_per_second": 0.485, "step": 76 }, { "epoch": 19.94, "learning_rate": 3.7037037037037037e-05, "loss": 0.4009, "step": 80 }, { "epoch": 19.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.08214119076728821, "eval_runtime": 3.6886, "eval_samples_per_second": 15.995, "eval_steps_per_second": 0.542, "step": 80 }, { "epoch": 20.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.09025811403989792, "eval_runtime": 4.3053, "eval_samples_per_second": 13.704, "eval_steps_per_second": 0.465, "step": 84 }, { "epoch": 21.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.12810270488262177, "eval_runtime": 3.7203, "eval_samples_per_second": 15.859, "eval_steps_per_second": 0.538, "step": 88 }, { "epoch": 22.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.09356144815683365, "eval_runtime": 4.118, "eval_samples_per_second": 14.328, "eval_steps_per_second": 0.486, "step": 92 }, { "epoch": 23.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.10591834783554077, "eval_runtime": 3.6933, "eval_samples_per_second": 15.975, "eval_steps_per_second": 0.542, "step": 96 }, { "epoch": 24.94, "learning_rate": 3.240740740740741e-05, "loss": 0.3482, "step": 100 }, { "epoch": 24.94, "eval_accuracy": 0.9491525423728814, "eval_loss": 0.14312368631362915, "eval_runtime": 4.1639, "eval_samples_per_second": 14.169, "eval_steps_per_second": 0.48, "step": 100 }, { "epoch": 25.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.08986904472112656, "eval_runtime": 3.7088, "eval_samples_per_second": 15.908, "eval_steps_per_second": 0.539, "step": 104 }, { "epoch": 26.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.06888163089752197, "eval_runtime": 4.1304, "eval_samples_per_second": 14.284, "eval_steps_per_second": 0.484, "step": 108 }, { "epoch": 27.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.07510155439376831, "eval_runtime": 3.7462, "eval_samples_per_second": 15.749, "eval_steps_per_second": 0.534, "step": 112 }, { "epoch": 28.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.08912018686532974, "eval_runtime": 3.7992, "eval_samples_per_second": 15.53, "eval_steps_per_second": 0.526, "step": 116 }, { "epoch": 29.94, "learning_rate": 2.777777777777778e-05, "loss": 0.3306, "step": 120 }, { "epoch": 29.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.05226200073957443, "eval_runtime": 4.2109, "eval_samples_per_second": 14.011, "eval_steps_per_second": 0.475, "step": 120 }, { "epoch": 30.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.07344209402799606, "eval_runtime": 3.9025, "eval_samples_per_second": 15.118, "eval_steps_per_second": 0.512, "step": 124 }, { "epoch": 31.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.07462318241596222, "eval_runtime": 4.1592, "eval_samples_per_second": 14.185, "eval_steps_per_second": 0.481, "step": 128 }, { "epoch": 32.94, "eval_accuracy": 0.9661016949152542, "eval_loss": 0.04742526262998581, "eval_runtime": 3.8091, "eval_samples_per_second": 15.489, "eval_steps_per_second": 0.525, "step": 132 }, { "epoch": 33.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.044318120926618576, "eval_runtime": 3.7853, "eval_samples_per_second": 15.587, "eval_steps_per_second": 0.528, "step": 136 }, { "epoch": 34.94, "learning_rate": 2.314814814814815e-05, "loss": 0.2871, "step": 140 }, { "epoch": 34.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.08141448348760605, "eval_runtime": 4.1875, "eval_samples_per_second": 14.09, "eval_steps_per_second": 0.478, "step": 140 }, { "epoch": 35.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.0690697729587555, "eval_runtime": 3.7869, "eval_samples_per_second": 15.58, "eval_steps_per_second": 0.528, "step": 144 }, { "epoch": 36.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.053145911544561386, "eval_runtime": 4.1845, "eval_samples_per_second": 14.1, "eval_steps_per_second": 0.478, "step": 148 }, { "epoch": 37.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.06143573671579361, "eval_runtime": 3.7811, "eval_samples_per_second": 15.604, "eval_steps_per_second": 0.529, "step": 152 }, { "epoch": 38.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.057755034416913986, "eval_runtime": 4.2237, "eval_samples_per_second": 13.969, "eval_steps_per_second": 0.474, "step": 156 }, { "epoch": 39.94, "learning_rate": 1.8518518518518518e-05, "loss": 0.2754, "step": 160 }, { "epoch": 39.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.05201863497495651, "eval_runtime": 3.7528, "eval_samples_per_second": 15.722, "eval_steps_per_second": 0.533, "step": 160 }, { "epoch": 40.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.05365251377224922, "eval_runtime": 3.7906, "eval_samples_per_second": 15.565, "eval_steps_per_second": 0.528, "step": 164 }, { "epoch": 41.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.04466838762164116, "eval_runtime": 4.0883, "eval_samples_per_second": 14.432, "eval_steps_per_second": 0.489, "step": 168 }, { "epoch": 42.94, "eval_accuracy": 1.0, "eval_loss": 0.028991766273975372, "eval_runtime": 3.7894, "eval_samples_per_second": 15.57, "eval_steps_per_second": 0.528, "step": 172 }, { "epoch": 43.94, "eval_accuracy": 1.0, "eval_loss": 0.029105449095368385, "eval_runtime": 4.1829, "eval_samples_per_second": 14.105, "eval_steps_per_second": 0.478, "step": 176 }, { "epoch": 44.94, "learning_rate": 1.388888888888889e-05, "loss": 0.269, "step": 180 }, { "epoch": 44.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03256472200155258, "eval_runtime": 3.7585, "eval_samples_per_second": 15.698, "eval_steps_per_second": 0.532, "step": 180 }, { "epoch": 45.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03297417610883713, "eval_runtime": 4.155, "eval_samples_per_second": 14.2, "eval_steps_per_second": 0.481, "step": 184 }, { "epoch": 46.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.034774668514728546, "eval_runtime": 3.7675, "eval_samples_per_second": 15.66, "eval_steps_per_second": 0.531, "step": 188 }, { "epoch": 47.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03467889130115509, "eval_runtime": 4.0766, "eval_samples_per_second": 14.473, "eval_steps_per_second": 0.491, "step": 192 }, { "epoch": 48.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03474270924925804, "eval_runtime": 3.7643, "eval_samples_per_second": 15.674, "eval_steps_per_second": 0.531, "step": 196 }, { "epoch": 49.94, "learning_rate": 9.259259259259259e-06, "loss": 0.2615, "step": 200 }, { "epoch": 49.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.04243284463882446, "eval_runtime": 4.0985, "eval_samples_per_second": 14.395, "eval_steps_per_second": 0.488, "step": 200 }, { "epoch": 50.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.04514499008655548, "eval_runtime": 3.9491, "eval_samples_per_second": 14.94, "eval_steps_per_second": 0.506, "step": 204 }, { "epoch": 51.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.043262287974357605, "eval_runtime": 3.6957, "eval_samples_per_second": 15.964, "eval_steps_per_second": 0.541, "step": 208 }, { "epoch": 52.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.035157691687345505, "eval_runtime": 4.172, "eval_samples_per_second": 14.142, "eval_steps_per_second": 0.479, "step": 212 }, { "epoch": 53.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03394060581922531, "eval_runtime": 3.7213, "eval_samples_per_second": 15.855, "eval_steps_per_second": 0.537, "step": 216 }, { "epoch": 54.94, "learning_rate": 4.6296296296296296e-06, "loss": 0.2386, "step": 220 }, { "epoch": 54.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03394594043493271, "eval_runtime": 4.1524, "eval_samples_per_second": 14.208, "eval_steps_per_second": 0.482, "step": 220 }, { "epoch": 55.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03388730436563492, "eval_runtime": 3.719, "eval_samples_per_second": 15.864, "eval_steps_per_second": 0.538, "step": 224 }, { "epoch": 56.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.034843575209379196, "eval_runtime": 4.1514, "eval_samples_per_second": 14.212, "eval_steps_per_second": 0.482, "step": 228 }, { "epoch": 57.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03663792461156845, "eval_runtime": 3.7689, "eval_samples_per_second": 15.654, "eval_steps_per_second": 0.531, "step": 232 }, { "epoch": 58.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03743705153465271, "eval_runtime": 4.1165, "eval_samples_per_second": 14.333, "eval_steps_per_second": 0.486, "step": 236 }, { "epoch": 59.94, "learning_rate": 0.0, "loss": 0.2362, "step": 240 }, { "epoch": 59.94, "eval_accuracy": 0.9830508474576272, "eval_loss": 0.03746996819972992, "eval_runtime": 3.7404, "eval_samples_per_second": 15.774, "eval_steps_per_second": 0.535, "step": 240 }, { "epoch": 59.94, "step": 240, "total_flos": 7.88616702456404e+17, "train_loss": 0.4937874893347422, "train_runtime": 3820.3512, "train_samples_per_second": 8.308, "train_steps_per_second": 0.063 } ], "max_steps": 240, "num_train_epochs": 60, "total_flos": 7.88616702456404e+17, "trial_name": null, "trial_params": null }