|
loss,grad_norm,learning_rate,epoch,step,eval_loss,eval_runtime,eval_samples_per_second,eval_steps_per_second,train_runtime,train_samples_per_second,train_steps_per_second,total_flos,train_loss |
|
1.2534,0.7888012528419495,4e-05,0.025,1,,,,,,,,, |
|
1.6814,1.304793119430542,8e-05,0.05,2,,,,,,,,, |
|
1.7566,1.2770837545394897,0.00012,0.075,3,,,,,,,,, |
|
1.3991,0.9290549755096436,0.00016,0.1,4,,,,,,,,, |
|
1.3387,0.8864096999168396,0.0002,0.125,5,,,,,,,,, |
|
,,,0.125,5,1.0552338361740112,7.1909,11.125,1.391,,,,, |
|
0.8119,0.3486979305744171,0.000192,0.15,6,,,,,,,,, |
|
0.8837,0.46293407678604126,0.00018400000000000003,0.175,7,,,,,,,,, |
|
0.6576,0.3244289755821228,0.00017600000000000002,0.2,8,,,,,,,,, |
|
0.6484,0.2247825413942337,0.000168,0.225,9,,,,,,,,, |
|
0.7436,0.4602418839931488,0.00016,0.25,10,,,,,,,,, |
|
,,,0.25,10,0.725510835647583,4.8682,16.433,2.054,,,,, |
|
0.7571,0.2589215636253357,0.000152,0.275,11,,,,,,,,, |
|
0.9006,0.40398478507995605,0.000144,0.3,12,,,,,,,,, |
|
0.5278,0.19507887959480286,0.00013600000000000003,0.325,13,,,,,,,,, |
|
0.5557,0.20721735060214996,0.00012800000000000002,0.35,14,,,,,,,,, |
|
0.5042,0.1408037394285202,0.00012,0.375,15,,,,,,,,, |
|
,,,0.375,15,0.6471825242042542,4.8773,16.403,2.05,,,,, |
|
0.6344,0.20234538614749908,0.00011200000000000001,0.4,16,,,,,,,,, |
|
0.5956,0.28273141384124756,0.00010400000000000001,0.425,17,,,,,,,,, |
|
0.6394,0.42618072032928467,9.6e-05,0.45,18,,,,,,,,, |
|
0.6881,0.23107975721359253,8.800000000000001e-05,0.475,19,,,,,,,,, |
|
0.5356,0.17914614081382751,8e-05,0.5,20,,,,,,,,, |
|
,,,0.5,20,0.5898063778877258,4.8632,16.45,2.056,,,,, |
|
0.5028,0.1842283010482788,7.2e-05,0.525,21,,,,,,,,, |
|
0.4696,0.17058564722537994,6.400000000000001e-05,0.55,22,,,,,,,,, |
|
0.6429,0.2980625331401825,5.6000000000000006e-05,0.575,23,,,,,,,,, |
|
0.5543,0.2445172369480133,4.8e-05,0.6,24,,,,,,,,, |
|
0.492,0.3871745765209198,4e-05,0.625,25,,,,,,,,, |
|
,,,0.625,25,0.5556104779243469,4.8657,16.442,2.055,,,,, |
|
0.4687,0.3489736318588257,3.2000000000000005e-05,0.65,26,,,,,,,,, |
|
0.5499,0.18392369151115417,2.4e-05,0.675,27,,,,,,,,, |
|
0.479,0.21796149015426636,1.6000000000000003e-05,0.7,28,,,,,,,,, |
|
0.5323,0.2878962457180023,8.000000000000001e-06,0.725,29,,,,,,,,, |
|
0.5485,0.22873283922672272,0.0,0.75,30,,,,,,,,, |
|
,,,0.75,30,0.5422899127006531,4.8679,16.434,2.054,,,,, |
|
,,,0.75,30,,,,,116.3306,2.063,0.258,2819390830755840.0,0.7584310283263525 |
|
|