{ "best_metric": 0.8523043960135418, "best_model_checkpoint": "result/my-sup-simcse-bert-base-lastterm", "epoch": 3.0, "global_step": 3231, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.12, "eval_avg_sts": 0.8194254390928033, "eval_sickr_spearman": 0.7990052495236399, "eval_stsb_spearman": 0.8398456286619668, "step": 125 }, { "epoch": 0.23, "eval_avg_sts": 0.8165670458735704, "eval_sickr_spearman": 0.7869509320268182, "eval_stsb_spearman": 0.8461831597203227, "step": 250 }, { "epoch": 0.35, "eval_avg_sts": 0.8228159333151963, "eval_sickr_spearman": 0.7957744855165066, "eval_stsb_spearman": 0.8498573811138859, "step": 375 }, { "epoch": 0.46, "learning_rate": 4.226245744351594e-05, "loss": 1.0808, "step": 500 }, { "epoch": 0.46, "eval_avg_sts": 0.8168153761131349, "eval_sickr_spearman": 0.7877662119426287, "eval_stsb_spearman": 0.8458645402836412, "step": 500 }, { "epoch": 0.58, "eval_avg_sts": 0.8156032349409434, "eval_sickr_spearman": 0.7826891323962145, "eval_stsb_spearman": 0.8485173374856724, "step": 625 }, { "epoch": 0.7, "eval_avg_sts": 0.8169960567322327, "eval_sickr_spearman": 0.7846676775577546, "eval_stsb_spearman": 0.849324435906711, "step": 750 }, { "epoch": 0.81, "eval_avg_sts": 0.8146560028725298, "eval_sickr_spearman": 0.7835492733607682, "eval_stsb_spearman": 0.8457627323842916, "step": 875 }, { "epoch": 0.93, "learning_rate": 3.452491488703188e-05, "loss": 0.8522, "step": 1000 }, { "epoch": 0.93, "eval_avg_sts": 0.8163927093002852, "eval_sickr_spearman": 0.7824352399940127, "eval_stsb_spearman": 0.8503501786065577, "step": 1000 }, { "epoch": 1.04, "eval_avg_sts": 0.8052909347246509, "eval_sickr_spearman": 0.7662991914658787, "eval_stsb_spearman": 0.8442826779834229, "step": 1125 }, { "epoch": 1.16, "eval_avg_sts": 0.8106314735517854, "eval_sickr_spearman": 0.77574806186519, "eval_stsb_spearman": 0.8455148852383809, "step": 1250 }, { "epoch": 1.28, "eval_avg_sts": 0.8113568861098444, "eval_sickr_spearman": 0.7783763237358834, "eval_stsb_spearman": 0.8443374484838054, "step": 1375 }, { "epoch": 1.39, "learning_rate": 2.678737233054782e-05, "loss": 0.6828, "step": 1500 }, { "epoch": 1.39, "eval_avg_sts": 0.8208657443062924, "eval_sickr_spearman": 0.7928466056350422, "eval_stsb_spearman": 0.8488848829775427, "step": 1500 }, { "epoch": 1.51, "eval_avg_sts": 0.8180871720303612, "eval_sickr_spearman": 0.7858960729770345, "eval_stsb_spearman": 0.8502782710836879, "step": 1625 }, { "epoch": 1.62, "eval_avg_sts": 0.8170722172992666, "eval_sickr_spearman": 0.7818400385849915, "eval_stsb_spearman": 0.8523043960135418, "step": 1750 }, { "epoch": 1.74, "eval_avg_sts": 0.81144903531131, "eval_sickr_spearman": 0.7756615098203985, "eval_stsb_spearman": 0.8472365608022215, "step": 1875 }, { "epoch": 1.86, "learning_rate": 1.9049829774063757e-05, "loss": 0.6522, "step": 2000 }, { "epoch": 1.86, "eval_avg_sts": 0.8141474203440927, "eval_sickr_spearman": 0.7794347370871737, "eval_stsb_spearman": 0.8488601036010117, "step": 2000 }, { "epoch": 1.97, "eval_avg_sts": 0.8158956922741192, "eval_sickr_spearman": 0.7808102517701584, "eval_stsb_spearman": 0.8509811327780799, "step": 2125 }, { "epoch": 2.09, "eval_avg_sts": 0.814587631326179, "eval_sickr_spearman": 0.7796313764164613, "eval_stsb_spearman": 0.8495438862358966, "step": 2250 }, { "epoch": 2.21, "eval_avg_sts": 0.8114095673015015, "eval_sickr_spearman": 0.7735022716552481, "eval_stsb_spearman": 0.8493168629477549, "step": 2375 }, { "epoch": 2.32, "learning_rate": 1.1312287217579697e-05, "loss": 0.5675, "step": 2500 }, { "epoch": 2.32, "eval_avg_sts": 0.8121220784998155, "eval_sickr_spearman": 0.7740748984465933, "eval_stsb_spearman": 0.8501692585530379, "step": 2500 }, { "epoch": 2.44, "eval_avg_sts": 0.8130334510314673, "eval_sickr_spearman": 0.7768290018030546, "eval_stsb_spearman": 0.84923790025988, "step": 2625 }, { "epoch": 2.55, "eval_avg_sts": 0.8140933803428295, "eval_sickr_spearman": 0.7770954303227319, "eval_stsb_spearman": 0.8510913303629272, "step": 2750 }, { "epoch": 2.67, "eval_avg_sts": 0.8149543004915998, "eval_sickr_spearman": 0.7786629253181646, "eval_stsb_spearman": 0.8512456756650348, "step": 2875 }, { "epoch": 2.79, "learning_rate": 3.574744661095636e-06, "loss": 0.5295, "step": 3000 }, { "epoch": 2.79, "eval_avg_sts": 0.8162287995156676, "eval_sickr_spearman": 0.7821816357784194, "eval_stsb_spearman": 0.8502759632529158, "step": 3000 }, { "epoch": 2.9, "eval_avg_sts": 0.8163857434466557, "eval_sickr_spearman": 0.7826894686139245, "eval_stsb_spearman": 0.850082018279387, "step": 3125 }, { "epoch": 3.0, "step": 3231, "train_runtime": 2076.5315, "train_samples_per_second": 1.556 } ], "max_steps": 3231, "num_train_epochs": 3, "total_flos": 52139850005053440, "trial_name": null, "trial_params": null }