|
{ |
|
"best_metric": 0.37634159533224454, |
|
"best_model_checkpoint": "/home2/s5432073/language-tech-project/results/ltp-roberta-large-defaultltp-roberta-large-default-2/checkpoint-1600", |
|
"epoch": 9.467455621301776, |
|
"global_step": 1600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 9.28348909657321e-06, |
|
"loss": 0.4492, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_f1": 0.11572875154130194, |
|
"eval_f1_all": [ |
|
0.0, |
|
0.05847953216374269, |
|
0.0, |
|
0.0, |
|
0.4682713347921225, |
|
0.0, |
|
0.0, |
|
0.0, |
|
0.6747759282970549, |
|
0.520393811533052, |
|
0.0, |
|
0.0, |
|
0.0, |
|
0.0, |
|
0.0, |
|
0.0, |
|
0.5926544240400667, |
|
0.0, |
|
0.0, |
|
0.0 |
|
], |
|
"eval_loss": 0.36748331785202026, |
|
"eval_runtime": 3.8035, |
|
"eval_samples_per_second": 498.483, |
|
"eval_steps_per_second": 15.775, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"learning_rate": 8.037383177570094e-06, |
|
"loss": 0.3449, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"eval_f1": 0.22644858426717676, |
|
"eval_f1_all": [ |
|
0.3419354838709677, |
|
0.30434782608695654, |
|
0.0, |
|
0.0, |
|
0.5748898678414096, |
|
0.0, |
|
0.3260869565217391, |
|
0.0, |
|
0.7539203860072377, |
|
0.5495118549511855, |
|
0.0879120879120879, |
|
0.23971377459749552, |
|
0.0, |
|
0.0, |
|
0.055045871559633024, |
|
0.0, |
|
0.6266548984995588, |
|
0.5684210526315789, |
|
0.008928571428571428, |
|
0.09160305343511452 |
|
], |
|
"eval_loss": 0.33438944816589355, |
|
"eval_runtime": 2.9482, |
|
"eval_samples_per_second": 643.096, |
|
"eval_steps_per_second": 20.351, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.55, |
|
"learning_rate": 6.791277258566978e-06, |
|
"loss": 0.3163, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 3.55, |
|
"eval_f1": 0.29790838893606486, |
|
"eval_f1_all": [ |
|
0.4838709677419356, |
|
0.4791965566714491, |
|
0.0, |
|
0.0, |
|
0.5882352941176471, |
|
0.012121212121212121, |
|
0.303030303030303, |
|
0.0, |
|
0.7144866385372716, |
|
0.574385510996119, |
|
0.3069767441860465, |
|
0.4, |
|
0.0, |
|
0.0, |
|
0.40190249702734837, |
|
0.0, |
|
0.6844840386043058, |
|
0.6761904761904762, |
|
0.034482758620689655, |
|
0.29880478087649404 |
|
], |
|
"eval_loss": 0.3200507164001465, |
|
"eval_runtime": 2.9119, |
|
"eval_samples_per_second": 651.111, |
|
"eval_steps_per_second": 20.605, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.73, |
|
"learning_rate": 5.545171339563863e-06, |
|
"loss": 0.3021, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 4.73, |
|
"eval_f1": 0.33206438169614216, |
|
"eval_f1_all": [ |
|
0.5162907268170427, |
|
0.5621761658031088, |
|
0.0, |
|
0.0, |
|
0.6198347107438016, |
|
0.08139534883720931, |
|
0.36734693877551017, |
|
0.0, |
|
0.7533632286995516, |
|
0.6167290886392011, |
|
0.36111111111111105, |
|
0.42990654205607476, |
|
0.0, |
|
0.0, |
|
0.5192909280500522, |
|
0.014814814814814815, |
|
0.6877828054298644, |
|
0.6568627450980392, |
|
0.08906882591093117, |
|
0.36531365313653136 |
|
], |
|
"eval_loss": 0.3112545609474182, |
|
"eval_runtime": 3.7309, |
|
"eval_samples_per_second": 508.183, |
|
"eval_steps_per_second": 16.082, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.92, |
|
"learning_rate": 4.299065420560748e-06, |
|
"loss": 0.2879, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.92, |
|
"eval_f1": 0.3556641957175606, |
|
"eval_f1_all": [ |
|
0.5228426395939088, |
|
0.5761843790012804, |
|
0.014285714285714285, |
|
0.05660377358490566, |
|
0.6353166986564299, |
|
0.09195402298850576, |
|
0.4059405940594059, |
|
0.0, |
|
0.7578814627994955, |
|
0.639225181598063, |
|
0.3873873873873874, |
|
0.49717514124293793, |
|
0.0, |
|
0.015503875968992248, |
|
0.5467059980334316, |
|
0.08934707903780069, |
|
0.6688907422852377, |
|
0.6995515695067265, |
|
0.09876543209876544, |
|
0.4097222222222222 |
|
], |
|
"eval_loss": 0.3077404499053955, |
|
"eval_runtime": 3.283, |
|
"eval_samples_per_second": 577.521, |
|
"eval_steps_per_second": 18.276, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.1, |
|
"learning_rate": 3.0529595015576325e-06, |
|
"loss": 0.2783, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 7.1, |
|
"eval_f1": 0.3662892905615983, |
|
"eval_f1_all": [ |
|
0.5064599483204134, |
|
0.5771643663739021, |
|
0.028169014084507046, |
|
0.125, |
|
0.6408730158730159, |
|
0.1222222222222222, |
|
0.35789473684210527, |
|
0.0, |
|
0.7578947368421052, |
|
0.6680988184747583, |
|
0.4291497975708502, |
|
0.5216178521617852, |
|
0.0, |
|
0.015503875968992248, |
|
0.5635864592863677, |
|
0.10135135135135136, |
|
0.6790622473726757, |
|
0.7058823529411764, |
|
0.10317460317460318, |
|
0.422680412371134 |
|
], |
|
"eval_loss": 0.3067641854286194, |
|
"eval_runtime": 3.0738, |
|
"eval_samples_per_second": 616.829, |
|
"eval_steps_per_second": 19.52, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 8.28, |
|
"learning_rate": 1.8068535825545173e-06, |
|
"loss": 0.2721, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 8.28, |
|
"eval_f1": 0.36379633008264506, |
|
"eval_f1_all": [ |
|
0.5247524752475247, |
|
0.5838509316770186, |
|
0.028368794326241138, |
|
0.07407407407407407, |
|
0.6463654223968567, |
|
0.13259668508287292, |
|
0.35106382978723405, |
|
0.0, |
|
0.7543075941289088, |
|
0.6308243727598566, |
|
0.4, |
|
0.5212620027434842, |
|
0.0, |
|
0.015503875968992248, |
|
0.5748709122203098, |
|
0.07612456747404846, |
|
0.6950959488272921, |
|
0.6986899563318777, |
|
0.14785992217898833, |
|
0.42031523642732044 |
|
], |
|
"eval_loss": 0.3058605194091797, |
|
"eval_runtime": 3.1337, |
|
"eval_samples_per_second": 605.037, |
|
"eval_steps_per_second": 19.147, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 9.47, |
|
"learning_rate": 5.607476635514019e-07, |
|
"loss": 0.2672, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 9.47, |
|
"eval_f1": 0.37634159533224454, |
|
"eval_f1_all": [ |
|
0.5393794749403341, |
|
0.5859085290482077, |
|
0.06896551724137931, |
|
0.15384615384615385, |
|
0.6564885496183206, |
|
0.12972972972972974, |
|
0.38000000000000006, |
|
0.0, |
|
0.7552715654952076, |
|
0.6600441501103753, |
|
0.41463414634146345, |
|
0.5263157894736842, |
|
0.0, |
|
0.015503875968992248, |
|
0.5658263305322129, |
|
0.10596026490066227, |
|
0.6955848179705655, |
|
0.7085201793721972, |
|
0.13076923076923078, |
|
0.4340836012861736 |
|
], |
|
"eval_loss": 0.3051939308643341, |
|
"eval_runtime": 3.2008, |
|
"eval_samples_per_second": 592.358, |
|
"eval_steps_per_second": 18.746, |
|
"step": 1600 |
|
} |
|
], |
|
"max_steps": 1690, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.1949029604729552e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|