stackexchange_codegolf / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
23fde87 verified
{"current_steps": 10, "total_steps": 150, "loss": 0.8013, "lr": 5e-06, "epoch": 0.19950124688279303, "percentage": 6.67, "elapsed_time": "0:09:31", "remaining_time": "2:13:14"}
{"current_steps": 20, "total_steps": 150, "loss": 0.6798, "lr": 5e-06, "epoch": 0.39900249376558605, "percentage": 13.33, "elapsed_time": "0:18:57", "remaining_time": "2:03:13"}
{"current_steps": 30, "total_steps": 150, "loss": 0.6411, "lr": 5e-06, "epoch": 0.5985037406483791, "percentage": 20.0, "elapsed_time": "0:28:23", "remaining_time": "1:53:34"}
{"current_steps": 40, "total_steps": 150, "loss": 0.6274, "lr": 5e-06, "epoch": 0.7980049875311721, "percentage": 26.67, "elapsed_time": "0:37:50", "remaining_time": "1:44:02"}
{"current_steps": 50, "total_steps": 150, "loss": 0.6123, "lr": 5e-06, "epoch": 0.9975062344139651, "percentage": 33.33, "elapsed_time": "0:47:15", "remaining_time": "1:34:31"}
{"current_steps": 50, "total_steps": 150, "eval_loss": 0.6066042184829712, "epoch": 0.9975062344139651, "percentage": 33.33, "elapsed_time": "0:48:16", "remaining_time": "1:36:32"}
{"current_steps": 60, "total_steps": 150, "loss": 0.6278, "lr": 5e-06, "epoch": 1.1970074812967582, "percentage": 40.0, "elapsed_time": "0:58:41", "remaining_time": "1:28:02"}
{"current_steps": 70, "total_steps": 150, "loss": 0.5677, "lr": 5e-06, "epoch": 1.3965087281795512, "percentage": 46.67, "elapsed_time": "1:08:07", "remaining_time": "1:17:51"}
{"current_steps": 80, "total_steps": 150, "loss": 0.5516, "lr": 5e-06, "epoch": 1.5960099750623442, "percentage": 53.33, "elapsed_time": "1:17:32", "remaining_time": "1:07:51"}
{"current_steps": 90, "total_steps": 150, "loss": 0.5397, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:26:57", "remaining_time": "0:57:58"}
{"current_steps": 100, "total_steps": 150, "loss": 0.5438, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:36:23", "remaining_time": "0:48:11"}
{"current_steps": 100, "total_steps": 150, "eval_loss": 0.5740869641304016, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:29", "remaining_time": "0:48:44"}
{"current_steps": 110, "total_steps": 150, "loss": 0.5407, "lr": 5e-06, "epoch": 2.1945137157107233, "percentage": 73.33, "elapsed_time": "1:47:51", "remaining_time": "0:39:13"}
{"current_steps": 120, "total_steps": 150, "loss": 0.4996, "lr": 5e-06, "epoch": 2.3940149625935163, "percentage": 80.0, "elapsed_time": "1:57:16", "remaining_time": "0:29:19"}
{"current_steps": 130, "total_steps": 150, "loss": 0.4972, "lr": 5e-06, "epoch": 2.5935162094763093, "percentage": 86.67, "elapsed_time": "2:06:44", "remaining_time": "0:19:29"}
{"current_steps": 140, "total_steps": 150, "loss": 0.4926, "lr": 5e-06, "epoch": 2.7930174563591024, "percentage": 93.33, "elapsed_time": "2:16:11", "remaining_time": "0:09:43"}
{"current_steps": 150, "total_steps": 150, "loss": 0.4952, "lr": 5e-06, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:25:37", "remaining_time": "0:00:00"}
{"current_steps": 150, "total_steps": 150, "eval_loss": 0.5672302842140198, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:27:42", "remaining_time": "0:00:00"}
{"current_steps": 150, "total_steps": 150, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:28:56", "remaining_time": "0:00:00"}