stackexchange_codereview / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
4a0af91 verified
{"current_steps": 10, "total_steps": 198, "loss": 0.9599, "lr": 5e-06, "epoch": 0.15037593984962405, "percentage": 5.05, "elapsed_time": "0:09:47", "remaining_time": "3:04:06"}
{"current_steps": 20, "total_steps": 198, "loss": 0.8336, "lr": 5e-06, "epoch": 0.3007518796992481, "percentage": 10.1, "elapsed_time": "0:19:30", "remaining_time": "2:53:35"}
{"current_steps": 30, "total_steps": 198, "loss": 0.7791, "lr": 5e-06, "epoch": 0.45112781954887216, "percentage": 15.15, "elapsed_time": "0:29:11", "remaining_time": "2:43:31"}
{"current_steps": 40, "total_steps": 198, "loss": 0.7583, "lr": 5e-06, "epoch": 0.6015037593984962, "percentage": 20.2, "elapsed_time": "0:38:55", "remaining_time": "2:33:43"}
{"current_steps": 50, "total_steps": 198, "loss": 0.7441, "lr": 5e-06, "epoch": 0.7518796992481203, "percentage": 25.25, "elapsed_time": "0:48:38", "remaining_time": "2:23:59"}
{"current_steps": 60, "total_steps": 198, "loss": 0.7377, "lr": 5e-06, "epoch": 0.9022556390977443, "percentage": 30.3, "elapsed_time": "0:58:20", "remaining_time": "2:14:11"}
{"current_steps": 66, "total_steps": 198, "eval_loss": 0.7360510230064392, "epoch": 0.9924812030075187, "percentage": 33.33, "elapsed_time": "1:05:49", "remaining_time": "2:11:39"}
{"current_steps": 70, "total_steps": 198, "loss": 0.7494, "lr": 5e-06, "epoch": 1.0526315789473684, "percentage": 35.35, "elapsed_time": "1:10:23", "remaining_time": "2:08:43"}
{"current_steps": 80, "total_steps": 198, "loss": 0.6823, "lr": 5e-06, "epoch": 1.2030075187969924, "percentage": 40.4, "elapsed_time": "1:20:06", "remaining_time": "1:58:10"}
{"current_steps": 90, "total_steps": 198, "loss": 0.6835, "lr": 5e-06, "epoch": 1.3533834586466165, "percentage": 45.45, "elapsed_time": "1:29:48", "remaining_time": "1:47:46"}
{"current_steps": 100, "total_steps": 198, "loss": 0.6778, "lr": 5e-06, "epoch": 1.5037593984962405, "percentage": 50.51, "elapsed_time": "1:39:30", "remaining_time": "1:37:31"}
{"current_steps": 110, "total_steps": 198, "loss": 0.6741, "lr": 5e-06, "epoch": 1.6541353383458648, "percentage": 55.56, "elapsed_time": "1:49:12", "remaining_time": "1:27:22"}
{"current_steps": 120, "total_steps": 198, "loss": 0.6786, "lr": 5e-06, "epoch": 1.8045112781954886, "percentage": 60.61, "elapsed_time": "1:58:52", "remaining_time": "1:17:16"}
{"current_steps": 130, "total_steps": 198, "loss": 0.6668, "lr": 5e-06, "epoch": 1.954887218045113, "percentage": 65.66, "elapsed_time": "2:08:34", "remaining_time": "1:07:15"}
{"current_steps": 133, "total_steps": 198, "eval_loss": 0.7167445421218872, "epoch": 2.0, "percentage": 67.17, "elapsed_time": "2:12:35", "remaining_time": "1:04:48"}
{"current_steps": 140, "total_steps": 198, "loss": 0.6702, "lr": 5e-06, "epoch": 2.1052631578947367, "percentage": 70.71, "elapsed_time": "2:20:35", "remaining_time": "0:58:14"}
{"current_steps": 150, "total_steps": 198, "loss": 0.6221, "lr": 5e-06, "epoch": 2.255639097744361, "percentage": 75.76, "elapsed_time": "2:30:17", "remaining_time": "0:48:05"}
{"current_steps": 160, "total_steps": 198, "loss": 0.6227, "lr": 5e-06, "epoch": 2.406015037593985, "percentage": 80.81, "elapsed_time": "2:40:00", "remaining_time": "0:38:00"}
{"current_steps": 170, "total_steps": 198, "loss": 0.625, "lr": 5e-06, "epoch": 2.556390977443609, "percentage": 85.86, "elapsed_time": "2:49:44", "remaining_time": "0:27:57"}
{"current_steps": 180, "total_steps": 198, "loss": 0.6189, "lr": 5e-06, "epoch": 2.706766917293233, "percentage": 90.91, "elapsed_time": "2:59:28", "remaining_time": "0:17:56"}
{"current_steps": 190, "total_steps": 198, "loss": 0.6284, "lr": 5e-06, "epoch": 2.857142857142857, "percentage": 95.96, "elapsed_time": "3:09:12", "remaining_time": "0:07:57"}
{"current_steps": 198, "total_steps": 198, "eval_loss": 0.7185549139976501, "epoch": 2.9774436090225564, "percentage": 100.0, "elapsed_time": "3:19:23", "remaining_time": "0:00:00"}
{"current_steps": 198, "total_steps": 198, "epoch": 2.9774436090225564, "percentage": 100.0, "elapsed_time": "3:20:39", "remaining_time": "0:00:00"}