|
{ |
|
"best_metric": 0.7635786873553013, |
|
"best_model_checkpoint": "model_checkpoint/fine-tuned_legalbert_multilabel_original_train/checkpoint-783", |
|
"epoch": 2.997129186602871, |
|
"eval_steps": 500, |
|
"global_step": 783, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.999043062200957, |
|
"eval_A_f1": 0.0, |
|
"eval_A_precision": 0.0, |
|
"eval_A_recall": 0.0, |
|
"eval_CH_f1": 0.0, |
|
"eval_CH_precision": 0.0, |
|
"eval_CH_recall": 0.0, |
|
"eval_CR_f1": 0.0, |
|
"eval_CR_precision": 0.0, |
|
"eval_CR_recall": 0.0, |
|
"eval_FAIR_f1": 0.9544351203273459, |
|
"eval_FAIR_precision": 0.9774147727272727, |
|
"eval_FAIR_recall": 0.9325111803767449, |
|
"eval_J_f1": 0.0, |
|
"eval_J_precision": 0.0, |
|
"eval_J_recall": 0.0, |
|
"eval_LAW_f1": 0.0, |
|
"eval_LAW_precision": 0.0, |
|
"eval_LAW_recall": 0.0, |
|
"eval_LTD_f1": 0.6153846153846154, |
|
"eval_LTD_precision": 0.7472527472527473, |
|
"eval_LTD_recall": 0.5230769230769231, |
|
"eval_TER_f1": 0.0, |
|
"eval_TER_precision": 0.0, |
|
"eval_TER_recall": 0.0, |
|
"eval_USE_f1": 0.017241379310344827, |
|
"eval_USE_precision": 1.0, |
|
"eval_USE_recall": 0.008695652173913044, |
|
"eval_accuracy": 0.8484116439183477, |
|
"eval_f1_macro": 0.17634012389136736, |
|
"eval_loss": 0.06019286438822746, |
|
"eval_precision_macro": 0.3027408355533356, |
|
"eval_recall_macro": 0.1626981950697312, |
|
"eval_runtime": 894.9212, |
|
"eval_samples_per_second": 9.251, |
|
"eval_steps_per_second": 0.579, |
|
"step": 261 |
|
}, |
|
{ |
|
"epoch": 1.9138755980861244, |
|
"grad_norm": 0.9339248538017273, |
|
"learning_rate": 1.8135376756066413e-05, |
|
"loss": 0.0784, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.998086124401914, |
|
"eval_A_f1": 0.5909090909090909, |
|
"eval_A_precision": 1.0, |
|
"eval_A_recall": 0.41935483870967744, |
|
"eval_CH_f1": 0.4873096446700508, |
|
"eval_CH_precision": 0.8571428571428571, |
|
"eval_CH_recall": 0.3404255319148936, |
|
"eval_CR_f1": 0.0, |
|
"eval_CR_precision": 0.0, |
|
"eval_CR_recall": 0.0, |
|
"eval_FAIR_f1": 0.9716993725804298, |
|
"eval_FAIR_precision": 0.9573852426673681, |
|
"eval_FAIR_recall": 0.9864480281881014, |
|
"eval_J_f1": 0.8623853211009175, |
|
"eval_J_precision": 0.9038461538461539, |
|
"eval_J_recall": 0.8245614035087719, |
|
"eval_LAW_f1": 0.7927927927927928, |
|
"eval_LAW_precision": 0.88, |
|
"eval_LAW_recall": 0.7213114754098361, |
|
"eval_LTD_f1": 0.6752688172043011, |
|
"eval_LTD_precision": 0.7658536585365854, |
|
"eval_LTD_recall": 0.6038461538461538, |
|
"eval_TER_f1": 0.6990881458966566, |
|
"eval_TER_precision": 0.7419354838709677, |
|
"eval_TER_recall": 0.6609195402298851, |
|
"eval_USE_f1": 0.6632124352331606, |
|
"eval_USE_precision": 0.8205128205128205, |
|
"eval_USE_recall": 0.5565217391304348, |
|
"eval_accuracy": 0.9299432298586786, |
|
"eval_f1_macro": 0.6380739578208222, |
|
"eval_loss": 0.04580436274409294, |
|
"eval_precision_macro": 0.7696306907307503, |
|
"eval_recall_macro": 0.568154301215306, |
|
"eval_runtime": 898.3262, |
|
"eval_samples_per_second": 9.216, |
|
"eval_steps_per_second": 0.577, |
|
"step": 522 |
|
}, |
|
{ |
|
"epoch": 2.997129186602871, |
|
"eval_A_f1": 0.7, |
|
"eval_A_precision": 0.7241379310344828, |
|
"eval_A_recall": 0.6774193548387096, |
|
"eval_CH_f1": 0.72, |
|
"eval_CH_precision": 0.8256880733944955, |
|
"eval_CH_recall": 0.6382978723404256, |
|
"eval_CR_f1": 0.6301369863013698, |
|
"eval_CR_precision": 0.8214285714285714, |
|
"eval_CR_recall": 0.5111111111111111, |
|
"eval_FAIR_f1": 0.9708172523529014, |
|
"eval_FAIR_precision": 0.9700947225981056, |
|
"eval_FAIR_recall": 0.9715408591950129, |
|
"eval_J_f1": 0.9026548672566371, |
|
"eval_J_precision": 0.9107142857142857, |
|
"eval_J_recall": 0.8947368421052632, |
|
"eval_LAW_f1": 0.8035714285714286, |
|
"eval_LAW_precision": 0.8823529411764706, |
|
"eval_LAW_recall": 0.7377049180327869, |
|
"eval_LTD_f1": 0.7022900763358778, |
|
"eval_LTD_precision": 0.696969696969697, |
|
"eval_LTD_recall": 0.7076923076923077, |
|
"eval_TER_f1": 0.7440476190476191, |
|
"eval_TER_precision": 0.7716049382716049, |
|
"eval_TER_recall": 0.7183908045977011, |
|
"eval_USE_f1": 0.6986899563318777, |
|
"eval_USE_precision": 0.7017543859649122, |
|
"eval_USE_recall": 0.6956521739130435, |
|
"eval_accuracy": 0.9356202439908201, |
|
"eval_f1_macro": 0.7635786873553013, |
|
"eval_loss": 0.043075863271951675, |
|
"eval_precision_macro": 0.8116383940614028, |
|
"eval_recall_macro": 0.7280606937584846, |
|
"eval_runtime": 894.9343, |
|
"eval_samples_per_second": 9.251, |
|
"eval_steps_per_second": 0.579, |
|
"step": 783 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 783, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 3, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"EarlyStoppingCallback": { |
|
"args": { |
|
"early_stopping_patience": 2, |
|
"early_stopping_threshold": 0.01 |
|
}, |
|
"attributes": { |
|
"early_stopping_patience_counter": 0 |
|
} |
|
}, |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 3294883706222592.0, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|