{ "best_metric": 2.2174315452575684, "best_model_checkpoint": "hBERTv2_new_no_pretrain_stsb/checkpoint-90", "epoch": 7.0, "global_step": 315, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 3.9200000000000004e-05, "loss": 2.3893, "step": 45 }, { "epoch": 1.0, "eval_combined_score": 0.11711747086860938, "eval_loss": 2.3697988986968994, "eval_pearson": 0.12043925832454841, "eval_runtime": 6.5953, "eval_samples_per_second": 227.435, "eval_spearmanr": 0.11379568341267035, "eval_steps_per_second": 1.819, "step": 45 }, { "epoch": 2.0, "learning_rate": 3.8400000000000005e-05, "loss": 1.9589, "step": 90 }, { "epoch": 2.0, "eval_combined_score": 0.20194085374544546, "eval_loss": 2.2174315452575684, "eval_pearson": 0.19461814333305827, "eval_runtime": 6.597, "eval_samples_per_second": 227.377, "eval_spearmanr": 0.20926356415783265, "eval_steps_per_second": 1.819, "step": 90 }, { "epoch": 3.0, "learning_rate": 3.76e-05, "loss": 1.6743, "step": 135 }, { "epoch": 3.0, "eval_combined_score": 0.2175435728704142, "eval_loss": 2.3480913639068604, "eval_pearson": 0.21439031391646174, "eval_runtime": 6.5993, "eval_samples_per_second": 227.299, "eval_spearmanr": 0.22069683182436667, "eval_steps_per_second": 1.818, "step": 135 }, { "epoch": 4.0, "learning_rate": 3.680000000000001e-05, "loss": 1.4068, "step": 180 }, { "epoch": 4.0, "eval_combined_score": 0.24955142048606804, "eval_loss": 2.5921387672424316, "eval_pearson": 0.247162444909398, "eval_runtime": 6.6007, "eval_samples_per_second": 227.248, "eval_spearmanr": 0.2519403960627381, "eval_steps_per_second": 1.818, "step": 180 }, { "epoch": 5.0, "learning_rate": 3.6e-05, "loss": 1.2205, "step": 225 }, { "epoch": 5.0, "eval_combined_score": 0.27093228753161847, "eval_loss": 2.627875566482544, "eval_pearson": 0.27178091382672603, "eval_runtime": 6.595, "eval_samples_per_second": 227.444, "eval_spearmanr": 0.27008366123651084, "eval_steps_per_second": 1.82, "step": 225 }, { "epoch": 6.0, "learning_rate": 3.52e-05, "loss": 0.9353, "step": 270 }, { "epoch": 6.0, "eval_combined_score": 0.316500979446309, "eval_loss": 2.5439531803131104, "eval_pearson": 0.3117440470832078, "eval_runtime": 6.6054, "eval_samples_per_second": 227.087, "eval_spearmanr": 0.3212579118094102, "eval_steps_per_second": 1.817, "step": 270 }, { "epoch": 7.0, "learning_rate": 3.44e-05, "loss": 0.7662, "step": 315 }, { "epoch": 7.0, "eval_combined_score": 0.3509809608594302, "eval_loss": 2.305265188217163, "eval_pearson": 0.35010838206071104, "eval_runtime": 6.5951, "eval_samples_per_second": 227.443, "eval_spearmanr": 0.3518535396581493, "eval_steps_per_second": 1.82, "step": 315 }, { "epoch": 7.0, "step": 315, "total_flos": 5889079841390592.0, "train_loss": 1.4787501380557107, "train_runtime": 694.6363, "train_samples_per_second": 413.814, "train_steps_per_second": 3.239 } ], "max_steps": 2250, "num_train_epochs": 50, "total_flos": 5889079841390592.0, "trial_name": null, "trial_params": null }