fayetitchenal's picture
Training in progress, step 18000, checkpoint
510bd2e verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 10.61320754716981,
"eval_steps": 2250,
"global_step": 18000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.589622641509434,
"grad_norm": 9.137022018432617,
"learning_rate": 2.9481132075471702e-05,
"loss": 2.8435,
"step": 1000
},
{
"epoch": 1.179245283018868,
"grad_norm": 6.052332401275635,
"learning_rate": 5.8962264150943403e-05,
"loss": 1.791,
"step": 2000
},
{
"epoch": 1.3266509433962264,
"eval_accuracy_background": 0.6658729859800179,
"eval_accuracy_double_plant": 0.44796971861142204,
"eval_accuracy_drydown": 0.838452272819733,
"eval_accuracy_endrow": 0.6564099936974693,
"eval_accuracy_nutrient_deficiency": 0.5255760511997533,
"eval_accuracy_planter_skip": 0.7062276764551357,
"eval_accuracy_water": 0.9873387227342924,
"eval_accuracy_waterway": 0.5770296385642565,
"eval_accuracy_weed_cluster": 0.4428120632960455,
"eval_iou_background": 0.5904190410028399,
"eval_iou_double_plant": 0.21713659970128166,
"eval_iou_drydown": 0.5191145408680865,
"eval_iou_endrow": 0.146705809299966,
"eval_iou_nutrient_deficiency": 0.3433700256479391,
"eval_iou_planter_skip": 0.19867844175237825,
"eval_iou_water": 0.3151796347651091,
"eval_iou_waterway": 0.17710299517028666,
"eval_iou_weed_cluster": 0.2871479144864637,
"eval_loss": 1.6307891607284546,
"eval_mean_accuracy": 0.6497432359286807,
"eval_mean_iou": 0.31053944474381673,
"eval_overall_accuracy": 0.6703095203666921,
"eval_runtime": 550.4413,
"eval_samples_per_second": 15.489,
"eval_steps_per_second": 0.485,
"step": 2250
},
{
"epoch": 1.7688679245283019,
"grad_norm": 10.023482322692871,
"learning_rate": 8.84433962264151e-05,
"loss": 1.5821,
"step": 3000
},
{
"epoch": 2.358490566037736,
"grad_norm": 3.805853843688965,
"learning_rate": 9.990216178505835e-05,
"loss": 1.4645,
"step": 4000
},
{
"epoch": 2.6533018867924527,
"eval_accuracy_background": 0.6928149295345922,
"eval_accuracy_double_plant": 0.520600810240665,
"eval_accuracy_drydown": 0.9041661302317083,
"eval_accuracy_endrow": 0.41216652623141536,
"eval_accuracy_nutrient_deficiency": 0.5572999343661789,
"eval_accuracy_planter_skip": 0.5885655971148109,
"eval_accuracy_water": 0.9012349964392468,
"eval_accuracy_waterway": 0.5122856732827319,
"eval_accuracy_weed_cluster": 0.3529035479823603,
"eval_iou_background": 0.6154372685119965,
"eval_iou_double_plant": 0.286691279808622,
"eval_iou_drydown": 0.5005889595647872,
"eval_iou_endrow": 0.23071917367118422,
"eval_iou_nutrient_deficiency": 0.34903960157986247,
"eval_iou_planter_skip": 0.3404743586046269,
"eval_iou_water": 0.4866735755203849,
"eval_iou_waterway": 0.17740336931417308,
"eval_iou_weed_cluster": 0.25445442999377565,
"eval_loss": 1.6076184511184692,
"eval_mean_accuracy": 0.6046709050470789,
"eval_mean_iou": 0.36016466850771256,
"eval_overall_accuracy": 0.6938899108737494,
"eval_runtime": 529.8506,
"eval_samples_per_second": 16.091,
"eval_steps_per_second": 0.504,
"step": 4500
},
{
"epoch": 2.94811320754717,
"grad_norm": 3.9986305236816406,
"learning_rate": 9.931699497285711e-05,
"loss": 1.3957,
"step": 5000
},
{
"epoch": 3.5377358490566038,
"grad_norm": 2.7372334003448486,
"learning_rate": 9.821001342355031e-05,
"loss": 1.3124,
"step": 6000
},
{
"epoch": 3.9799528301886795,
"eval_accuracy_background": 0.6307230231497055,
"eval_accuracy_double_plant": 0.48486363452173786,
"eval_accuracy_drydown": 0.8612367898895216,
"eval_accuracy_endrow": 0.5075110635399532,
"eval_accuracy_nutrient_deficiency": 0.6861430352037324,
"eval_accuracy_planter_skip": 0.6031976315027698,
"eval_accuracy_water": 0.9802194342104156,
"eval_accuracy_waterway": 0.48897799511586637,
"eval_accuracy_weed_cluster": 0.556708376519504,
"eval_iou_background": 0.5741567963414517,
"eval_iou_double_plant": 0.2860919486620036,
"eval_iou_drydown": 0.5029587941632667,
"eval_iou_endrow": 0.22521629078173816,
"eval_iou_nutrient_deficiency": 0.3596590524564408,
"eval_iou_planter_skip": 0.3023475517768152,
"eval_iou_water": 0.41466030404934484,
"eval_iou_waterway": 0.11905712637247004,
"eval_iou_weed_cluster": 0.3161136298740651,
"eval_loss": 1.6003777980804443,
"eval_mean_accuracy": 0.6443978870725785,
"eval_mean_iou": 0.34447349938639954,
"eval_overall_accuracy": 0.6672287911844751,
"eval_runtime": 529.5311,
"eval_samples_per_second": 16.101,
"eval_steps_per_second": 0.504,
"step": 6750
},
{
"epoch": 4.127358490566038,
"grad_norm": 3.5192806720733643,
"learning_rate": 9.65929299206612e-05,
"loss": 1.2631,
"step": 7000
},
{
"epoch": 4.716981132075472,
"grad_norm": 3.9972991943359375,
"learning_rate": 9.448285454973738e-05,
"loss": 1.2003,
"step": 8000
},
{
"epoch": 5.306603773584905,
"grad_norm": 5.617863178253174,
"learning_rate": 9.190211365944541e-05,
"loss": 1.1545,
"step": 9000
},
{
"epoch": 5.306603773584905,
"eval_accuracy_background": 0.7152218890852868,
"eval_accuracy_double_plant": 0.559446789259611,
"eval_accuracy_drydown": 0.7926407431922761,
"eval_accuracy_endrow": 0.5090316219335013,
"eval_accuracy_nutrient_deficiency": 0.5738896211353212,
"eval_accuracy_planter_skip": 0.6593127897989867,
"eval_accuracy_water": 0.9642661896511828,
"eval_accuracy_waterway": 0.46492080717677636,
"eval_accuracy_weed_cluster": 0.5152471841227493,
"eval_iou_background": 0.6309696025011753,
"eval_iou_double_plant": 0.33576586005371956,
"eval_iou_drydown": 0.5023456898026126,
"eval_iou_endrow": 0.24985551240605414,
"eval_iou_nutrient_deficiency": 0.36416354391893857,
"eval_iou_planter_skip": 0.3932620146979082,
"eval_iou_water": 0.46396310962016846,
"eval_iou_waterway": 0.16987197692528003,
"eval_iou_weed_cluster": 0.29655626229371107,
"eval_loss": 1.5461719036102295,
"eval_mean_accuracy": 0.6393308483728546,
"eval_mean_iou": 0.3785281746910631,
"eval_overall_accuracy": 0.7041663407297746,
"eval_runtime": 529.5113,
"eval_samples_per_second": 16.102,
"eval_steps_per_second": 0.504,
"step": 9000
},
{
"epoch": 5.89622641509434,
"grad_norm": 1.9349929094314575,
"learning_rate": 8.887801363027234e-05,
"loss": 1.1301,
"step": 10000
},
{
"epoch": 6.485849056603773,
"grad_norm": 3.736844539642334,
"learning_rate": 8.544255195035733e-05,
"loss": 1.0996,
"step": 11000
},
{
"epoch": 6.633254716981132,
"eval_accuracy_background": 0.7321345719725818,
"eval_accuracy_double_plant": 0.5061561579791534,
"eval_accuracy_drydown": 0.6959542485519916,
"eval_accuracy_endrow": 0.4876229883472026,
"eval_accuracy_nutrient_deficiency": 0.6450410877845559,
"eval_accuracy_planter_skip": 0.7014340631125459,
"eval_accuracy_water": 0.9722180984130999,
"eval_accuracy_waterway": 0.4680069536108854,
"eval_accuracy_weed_cluster": 0.5999105125905921,
"eval_iou_background": 0.6400560054890143,
"eval_iou_double_plant": 0.3502816119859484,
"eval_iou_drydown": 0.48456196377624977,
"eval_iou_endrow": 0.2639788246911193,
"eval_iou_nutrient_deficiency": 0.396585559445601,
"eval_iou_planter_skip": 0.3409834868970738,
"eval_iou_water": 0.44451378617604653,
"eval_iou_waterway": 0.16081881352962019,
"eval_iou_weed_cluster": 0.33812444541681147,
"eval_loss": 1.492088794708252,
"eval_mean_accuracy": 0.645386520262512,
"eval_mean_iou": 0.37998938860083165,
"eval_overall_accuracy": 0.7115690581547556,
"eval_runtime": 529.9729,
"eval_samples_per_second": 16.088,
"eval_steps_per_second": 0.504,
"step": 11250
},
{
"epoch": 7.0754716981132075,
"grad_norm": 1.84828782081604,
"learning_rate": 8.163207865551112e-05,
"loss": 1.0727,
"step": 12000
},
{
"epoch": 7.665094339622642,
"grad_norm": 2.411391258239746,
"learning_rate": 7.748691171566864e-05,
"loss": 1.0468,
"step": 13000
},
{
"epoch": 7.959905660377358,
"eval_accuracy_background": 0.7526398125858199,
"eval_accuracy_double_plant": 0.5617747160876485,
"eval_accuracy_drydown": 0.7416084130046285,
"eval_accuracy_endrow": 0.5035272340399668,
"eval_accuracy_nutrient_deficiency": 0.531805617343839,
"eval_accuracy_planter_skip": 0.6247280891527807,
"eval_accuracy_water": 0.9841431099962412,
"eval_accuracy_waterway": 0.4783465745730863,
"eval_accuracy_weed_cluster": 0.47373664220884076,
"eval_iou_background": 0.6514530993735008,
"eval_iou_double_plant": 0.3221799261469335,
"eval_iou_drydown": 0.496553324050437,
"eval_iou_endrow": 0.25636256499323895,
"eval_iou_nutrient_deficiency": 0.36014685659389084,
"eval_iou_planter_skip": 0.3605061710097777,
"eval_iou_water": 0.4365396537110217,
"eval_iou_waterway": 0.14037628353126624,
"eval_iou_weed_cluster": 0.3214568250037232,
"eval_loss": 1.5932934284210205,
"eval_mean_accuracy": 0.6280344676658723,
"eval_mean_iou": 0.37173052271264334,
"eval_overall_accuracy": 0.7170902700988321,
"eval_runtime": 529.3378,
"eval_samples_per_second": 16.107,
"eval_steps_per_second": 0.504,
"step": 13500
},
{
"epoch": 8.254716981132075,
"grad_norm": 1.4569978713989258,
"learning_rate": 7.305091043730557e-05,
"loss": 1.0271,
"step": 14000
},
{
"epoch": 8.84433962264151,
"grad_norm": 2.9907829761505127,
"learning_rate": 6.837101139557501e-05,
"loss": 1.0036,
"step": 15000
},
{
"epoch": 9.286556603773585,
"eval_accuracy_background": 0.7598414375076388,
"eval_accuracy_double_plant": 0.5177256602627419,
"eval_accuracy_drydown": 0.7154793750660278,
"eval_accuracy_endrow": 0.5012670182902391,
"eval_accuracy_nutrient_deficiency": 0.5368322761783371,
"eval_accuracy_planter_skip": 0.5468935952263279,
"eval_accuracy_water": 0.937019395570021,
"eval_accuracy_waterway": 0.49325926542068943,
"eval_accuracy_weed_cluster": 0.4951997709703656,
"eval_iou_background": 0.653841296382127,
"eval_iou_double_plant": 0.3556917179689535,
"eval_iou_drydown": 0.48554419750993316,
"eval_iou_endrow": 0.2419919783626517,
"eval_iou_nutrient_deficiency": 0.3544690920377324,
"eval_iou_planter_skip": 0.3770845151472525,
"eval_iou_water": 0.4813163648581422,
"eval_iou_waterway": 0.1553945460962498,
"eval_iou_weed_cluster": 0.32913578509118946,
"eval_loss": 1.6111669540405273,
"eval_mean_accuracy": 0.6115019771658209,
"eval_mean_iou": 0.3816077214949146,
"eval_overall_accuracy": 0.7184015448031484,
"eval_runtime": 530.1576,
"eval_samples_per_second": 16.082,
"eval_steps_per_second": 0.504,
"step": 15750
},
{
"epoch": 9.433962264150944,
"grad_norm": 1.7846933603286743,
"learning_rate": 6.34967318063877e-05,
"loss": 0.9725,
"step": 16000
},
{
"epoch": 10.023584905660377,
"grad_norm": 1.7969969511032104,
"learning_rate": 5.847964559317128e-05,
"loss": 0.9677,
"step": 17000
},
{
"epoch": 10.61320754716981,
"grad_norm": 3.443549156188965,
"learning_rate": 5.3372837691956955e-05,
"loss": 0.9443,
"step": 18000
},
{
"epoch": 10.61320754716981,
"eval_accuracy_background": 0.7705968530221318,
"eval_accuracy_double_plant": 0.5181034194377331,
"eval_accuracy_drydown": 0.6903163741892455,
"eval_accuracy_endrow": 0.4835231803753014,
"eval_accuracy_nutrient_deficiency": 0.5916561216478401,
"eval_accuracy_planter_skip": 0.5335884546146096,
"eval_accuracy_water": 0.9620806979435361,
"eval_accuracy_waterway": 0.43880698473219176,
"eval_accuracy_weed_cluster": 0.3965401585703216,
"eval_iou_background": 0.6599883230602321,
"eval_iou_double_plant": 0.34125555031911986,
"eval_iou_drydown": 0.48090155814983737,
"eval_iou_endrow": 0.27739686571309646,
"eval_iou_nutrient_deficiency": 0.37205107367408047,
"eval_iou_planter_skip": 0.34566214329213907,
"eval_iou_water": 0.4751891278946817,
"eval_iou_waterway": 0.18319416480334516,
"eval_iou_weed_cluster": 0.28830863200785295,
"eval_loss": 1.7351711988449097,
"eval_mean_accuracy": 0.5983569160592123,
"eval_mean_iou": 0.38043860432382054,
"eval_overall_accuracy": 0.7224762810473321,
"eval_runtime": 547.3444,
"eval_samples_per_second": 15.577,
"eval_steps_per_second": 0.488,
"step": 18000
}
],
"logging_steps": 1000,
"max_steps": 33920,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 2250,
"total_flos": 3.0653390846567645e+20,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}