|
{ |
|
"best_metric": 0.815129401249849, |
|
"best_model_checkpoint": "result/my-unsup-simcse-bert-base-uncased", |
|
"epoch": 0.2399846409829771, |
|
"global_step": 1875, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.7118506537188065, |
|
"eval_sickr_spearman": 0.7191480759127982, |
|
"eval_stsb_spearman": 0.704553231524815, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_avg_sts": 0.7490824841945876, |
|
"eval_sickr_spearman": 0.7415587518643453, |
|
"eval_stsb_spearman": 0.7566062165248297, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_avg_sts": 0.761657495121701, |
|
"eval_sickr_spearman": 0.7473965027359571, |
|
"eval_stsb_spearman": 0.7759184875074447, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 2.8080122872136184e-05, |
|
"loss": 0.0028, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7557478973832961, |
|
"eval_sickr_spearman": 0.739644291594853, |
|
"eval_stsb_spearman": 0.7718515031717392, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_avg_sts": 0.7582679338253449, |
|
"eval_sickr_spearman": 0.745471220921864, |
|
"eval_stsb_spearman": 0.7710646467288258, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7584985773227231, |
|
"eval_sickr_spearman": 0.7513467923228714, |
|
"eval_stsb_spearman": 0.7656503623225748, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_avg_sts": 0.7382867459735918, |
|
"eval_sickr_spearman": 0.6915170632864946, |
|
"eval_stsb_spearman": 0.785056428660689, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 2.6160245744272367e-05, |
|
"loss": 0.001, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_avg_sts": 0.7696010959205108, |
|
"eval_sickr_spearman": 0.7403704289249832, |
|
"eval_stsb_spearman": 0.7988317629160384, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7688633369693862, |
|
"eval_sickr_spearman": 0.7358842236914375, |
|
"eval_stsb_spearman": 0.8018424502473349, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_avg_sts": 0.7735971189091344, |
|
"eval_sickr_spearman": 0.7425422731621982, |
|
"eval_stsb_spearman": 0.8046519646560706, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.7754623637694573, |
|
"eval_sickr_spearman": 0.7437673388828963, |
|
"eval_stsb_spearman": 0.8071573886560185, |
|
"step": 1375 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 2.424036861640855e-05, |
|
"loss": 0.0002, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_avg_sts": 0.7741734659454558, |
|
"eval_sickr_spearman": 0.7443858813788181, |
|
"eval_stsb_spearman": 0.8039610505120934, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.21, |
|
"eval_avg_sts": 0.779812815773511, |
|
"eval_sickr_spearman": 0.7505964761581395, |
|
"eval_stsb_spearman": 0.8090291553888825, |
|
"step": 1625 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.7806364317746171, |
|
"eval_sickr_spearman": 0.7509446342591667, |
|
"eval_stsb_spearman": 0.8103282292900675, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_avg_sts": 0.785057765369954, |
|
"eval_sickr_spearman": 0.7549861294900588, |
|
"eval_stsb_spearman": 0.815129401249849, |
|
"step": 1875 |
|
} |
|
], |
|
"max_steps": 7813, |
|
"num_train_epochs": 1, |
|
"total_flos": 0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|