|
{ |
|
"before_init_mem_cpu": 3040526336, |
|
"before_init_mem_gpu": 512, |
|
"epoch": 18.0, |
|
"eval_-_f1-score": 0.3333333333333333, |
|
"eval_-_precision": 0.42857142857142855, |
|
"eval_-_recall": 0.2727272727272727, |
|
"eval_-_support": 22.0, |
|
"eval_<_f1-score": 0.9691187031907254, |
|
"eval_<_precision": 0.9674313805817288, |
|
"eval_<_recall": 0.9708119218910586, |
|
"eval_<_support": 4865.0, |
|
"eval_=_f1-score": 0.8385744234800838, |
|
"eval_=_precision": 0.8733624454148472, |
|
"eval_=_recall": 0.8064516129032258, |
|
"eval_=_support": 248.0, |
|
"eval_>_f1-score": 0.9696098562628337, |
|
"eval_>_precision": 0.9686153846153847, |
|
"eval_>_recall": 0.9706063720452209, |
|
"eval_>_support": 4865.0, |
|
"eval_accuracy": 0.9651, |
|
"eval_loss": 0.10465546697378159, |
|
"eval_macro_avg_f1-score": 0.777659079066744, |
|
"eval_macro_avg_precision": 0.8094951597958472, |
|
"eval_macro_avg_recall": 0.7551492948916945, |
|
"eval_macro_avg_support": 10000.0, |
|
"eval_mem_cpu_alloc_delta": -175185920, |
|
"eval_mem_cpu_peaked_delta": 175185920, |
|
"eval_mem_gpu_alloc_delta": 0, |
|
"eval_mem_gpu_peaked_delta": 1242359296, |
|
"eval_runtime": 12.3635, |
|
"eval_samples": 10000, |
|
"eval_samples_per_second": 808.83, |
|
"eval_steps_per_second": 3.235, |
|
"eval_weighted_avg_f1-score": 0.964721423209796, |
|
"eval_weighted_avg_precision": 0.964488997057541, |
|
"eval_weighted_avg_recall": 0.9651, |
|
"eval_weighted_avg_support": 10000.0, |
|
"init_mem_cpu_alloc_delta": 18427904, |
|
"init_mem_cpu_peaked_delta": 0, |
|
"init_mem_gpu_alloc_delta": 0, |
|
"init_mem_gpu_peaked_delta": 0, |
|
"total_flos": 2.949719748897669e+18, |
|
"train_loss": 0.22952656600628965, |
|
"train_mem_cpu_alloc_delta": 826355712, |
|
"train_mem_cpu_peaked_delta": 403324928, |
|
"train_mem_gpu_alloc_delta": 690193408, |
|
"train_mem_gpu_peaked_delta": 19408810496, |
|
"train_runtime": 33563.6304, |
|
"train_samples": 502272, |
|
"train_samples_per_second": 448.943, |
|
"train_steps_per_second": 0.877 |
|
} |