File size: 5,959 Bytes
78017bf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
{"current_steps": 10, "total_steps": 250, "loss": 2.103, "learning_rate": 4.000000000000001e-06, "epoch": 0.08, "percentage": 4.0, "elapsed_time": "0:00:25", "remaining_time": "0:10:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 250, "loss": 1.8909, "learning_rate": 8.000000000000001e-06, "epoch": 0.16, "percentage": 8.0, "elapsed_time": "0:00:43", "remaining_time": "0:08:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 250, "loss": 1.824, "learning_rate": 9.987820251299121e-06, "epoch": 0.24, "percentage": 12.0, "elapsed_time": "0:01:02", "remaining_time": "0:07:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 250, "loss": 1.7976, "learning_rate": 9.890738003669029e-06, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "0:01:21", "remaining_time": "0:07:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 250, "loss": 1.7517, "learning_rate": 9.698463103929542e-06, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:01:38", "remaining_time": "0:06:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 250, "loss": 1.7713, "learning_rate": 9.414737964294636e-06, "epoch": 0.48, "percentage": 24.0, "elapsed_time": "0:01:56", "remaining_time": "0:06:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 250, "loss": 1.7739, "learning_rate": 9.045084971874738e-06, "epoch": 0.56, "percentage": 28.0, "elapsed_time": "0:02:14", "remaining_time": "0:05:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 250, "loss": 1.7582, "learning_rate": 8.596699001693257e-06, "epoch": 0.64, "percentage": 32.0, "elapsed_time": "0:02:32", "remaining_time": "0:05:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 250, "loss": 1.7622, "learning_rate": 8.078307376628292e-06, "epoch": 0.72, "percentage": 36.0, "elapsed_time": "0:02:49", "remaining_time": "0:05:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 250, "loss": 1.7483, "learning_rate": 7.500000000000001e-06, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:03:08", "remaining_time": "0:04:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 250, "loss": 1.7125, "learning_rate": 6.873032967079562e-06, "epoch": 0.88, "percentage": 44.0, "elapsed_time": "0:03:26", "remaining_time": "0:04:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 250, "loss": 1.7158, "learning_rate": 6.209609477998339e-06, "epoch": 0.96, "percentage": 48.0, "elapsed_time": "0:03:43", "remaining_time": "0:04:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 250, "loss": 1.5306, "learning_rate": 5.522642316338268e-06, "epoch": 1.04, "percentage": 52.0, "elapsed_time": "0:04:02", "remaining_time": "0:03:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 250, "loss": 1.216, "learning_rate": 4.825502516487497e-06, "epoch": 1.12, "percentage": 56.0, "elapsed_time": "0:04:19", "remaining_time": "0:03:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 250, "loss": 1.2646, "learning_rate": 4.131759111665349e-06, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "0:04:38", "remaining_time": "0:03:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 250, "loss": 1.1715, "learning_rate": 3.4549150281252635e-06, "epoch": 1.28, "percentage": 64.0, "elapsed_time": "0:04:55", "remaining_time": "0:02:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 250, "loss": 1.1951, "learning_rate": 2.8081442660546126e-06, "epoch": 1.3599999999999999, "percentage": 68.0, "elapsed_time": "0:05:13", "remaining_time": "0:02:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 250, "loss": 1.183, "learning_rate": 2.204035482646267e-06, "epoch": 1.44, "percentage": 72.0, "elapsed_time": "0:05:32", "remaining_time": "0:02:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 250, "loss": 1.1787, "learning_rate": 1.6543469682057105e-06, "epoch": 1.52, "percentage": 76.0, "elapsed_time": "0:05:49", "remaining_time": "0:01:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 250, "loss": 1.215, "learning_rate": 1.1697777844051105e-06, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "0:06:07", "remaining_time": "0:01:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 250, "loss": 1.1823, "learning_rate": 7.597595192178702e-07, "epoch": 1.6800000000000002, "percentage": 84.0, "elapsed_time": "0:06:25", "remaining_time": "0:01:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 250, "loss": 1.1846, "learning_rate": 4.322727117869951e-07, "epoch": 1.76, "percentage": 88.0, "elapsed_time": "0:06:44", "remaining_time": "0:00:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 250, "loss": 1.1522, "learning_rate": 1.9369152030840553e-07, "epoch": 1.8399999999999999, "percentage": 92.0, "elapsed_time": "0:07:01", "remaining_time": "0:00:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 250, "loss": 1.0957, "learning_rate": 4.865965629214819e-08, "epoch": 1.92, "percentage": 96.0, "elapsed_time": "0:07:18", "remaining_time": "0:00:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 250, "loss": 1.1635, "learning_rate": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:07:36", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 250, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:08:40", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}