{ "best_metric": 0.965675057208238, "best_model_checkpoint": "/content/drive/MyDrive/Papers/RAG_3GPP/models/checkpoints/embedding/bge-small-telecom_15e_512bs/checkpoint-45", "epoch": 3.8181818181818183, "eval_steps": 15, "global_step": 45, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.2727272727272727, "grad_norm": 1.7355202436447144, "learning_rate": 4.411764705882353e-05, "loss": 1.0332, "step": 15 }, { "epoch": 1.2727272727272727, "eval_loss": 0.0967816412448883, "eval_runtime": 3.2637, "eval_samples_per_second": 401.687, "eval_steps_per_second": 0.919, "eval_telecom-ir-eval_cosine_accuracy@1": 0.9450800915331807, "eval_telecom-ir-eval_cosine_accuracy@10": 0.9931350114416476, "eval_telecom-ir-eval_cosine_accuracy@3": 0.9870327993897788, "eval_telecom-ir-eval_cosine_accuracy@5": 0.988558352402746, "eval_telecom-ir-eval_cosine_map@100": 0.96574625373806, "eval_telecom-ir-eval_cosine_mrr@10": 0.9655954499776009, "eval_telecom-ir-eval_cosine_ndcg@10": 0.9725340084355174, "eval_telecom-ir-eval_cosine_precision@1": 0.9450800915331807, "eval_telecom-ir-eval_cosine_recall@1": 0.9450800915331807, "step": 15 }, { "epoch": 2.5454545454545454, "grad_norm": 0.8801536560058594, "learning_rate": 4.9054165035221236e-05, "loss": 0.2091, "step": 30 }, { "epoch": 2.5454545454545454, "eval_loss": 0.05175875499844551, "eval_runtime": 3.3397, "eval_samples_per_second": 392.552, "eval_steps_per_second": 0.898, "eval_telecom-ir-eval_cosine_accuracy@1": 0.96186117467582, "eval_telecom-ir-eval_cosine_accuracy@10": 0.9938977879481312, "eval_telecom-ir-eval_cosine_accuracy@3": 0.9908466819221968, "eval_telecom-ir-eval_cosine_accuracy@5": 0.992372234935164, "eval_telecom-ir-eval_cosine_map@100": 0.976456964386964, "eval_telecom-ir-eval_cosine_mrr@10": 0.9762734130011017, "eval_telecom-ir-eval_cosine_ndcg@10": 0.9807745601952235, "eval_telecom-ir-eval_cosine_precision@1": 0.96186117467582, "eval_telecom-ir-eval_cosine_recall@1": 0.96186117467582, "step": 30 }, { "epoch": 3.8181818181818183, "grad_norm": 0.5518485307693481, "learning_rate": 4.571274123109606e-05, "loss": 0.0997, "step": 45 }, { "epoch": 3.8181818181818183, "eval_loss": 0.046976786106824875, "eval_runtime": 3.4455, "eval_samples_per_second": 380.5, "eval_steps_per_second": 0.871, "eval_telecom-ir-eval_cosine_accuracy@1": 0.965675057208238, "eval_telecom-ir-eval_cosine_accuracy@10": 0.9938977879481312, "eval_telecom-ir-eval_cosine_accuracy@3": 0.992372234935164, "eval_telecom-ir-eval_cosine_accuracy@5": 0.9931350114416476, "eval_telecom-ir-eval_cosine_map@100": 0.9786169716375667, "eval_telecom-ir-eval_cosine_mrr@10": 0.9784334023464457, "eval_telecom-ir-eval_cosine_ndcg@10": 0.9824027787882591, "eval_telecom-ir-eval_cosine_precision@1": 0.965675057208238, "eval_telecom-ir-eval_cosine_recall@1": 0.965675057208238, "step": 45 } ], "logging_steps": 15, "max_steps": 165, "num_input_tokens_seen": 0, "num_train_epochs": 15, "save_steps": 15, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 512, "trial_name": null, "trial_params": null }