Pham Thanh Dat
Upload checkpoints
de69c99
{
"best_metric": 0.5081,
"best_model_checkpoint": "ms-cond-detr-res-50-vehicles/checkpoint-80675",
"epoch": 36.0,
"eval_steps": 500,
"global_step": 82980,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.21691973969631237,
"grad_norm": 38753.67578125,
"learning_rate": 9.999686465963656e-05,
"loss": 1.2341,
"step": 500
},
{
"epoch": 0.43383947939262474,
"grad_norm": 14156.765625,
"learning_rate": 9.998728034076959e-05,
"loss": 1.1441,
"step": 1000
},
{
"epoch": 0.6507592190889371,
"grad_norm": 7688.85986328125,
"learning_rate": 9.99712861472983e-05,
"loss": 1.1357,
"step": 1500
},
{
"epoch": 0.8676789587852495,
"grad_norm": 10963.5341796875,
"learning_rate": 9.994882003818517e-05,
"loss": 1.1322,
"step": 2000
},
{
"epoch": 1.0,
"eval_loss": 1.0705492496490479,
"eval_map": 0.3886,
"eval_map_50": 0.7276,
"eval_map_75": 0.371,
"eval_map_bus": 0.4553,
"eval_map_car": 0.4267,
"eval_map_container": 0.4051,
"eval_map_large": 0.6092,
"eval_map_medium": 0.3725,
"eval_map_motorbike": 0.2674,
"eval_map_small": 0.0755,
"eval_mar_1": 0.2228,
"eval_mar_10": 0.4736,
"eval_mar_100": 0.5226,
"eval_mar_100_bus": 0.6014,
"eval_mar_100_car": 0.5398,
"eval_mar_100_container": 0.5541,
"eval_mar_100_motorbike": 0.395,
"eval_mar_large": 0.7004,
"eval_mar_medium": 0.5176,
"eval_mar_small": 0.2475,
"eval_runtime": 149.8641,
"eval_samples_per_second": 15.367,
"eval_steps_per_second": 1.922,
"step": 2305
},
{
"epoch": 1.0845986984815619,
"grad_norm": 8778.8525390625,
"learning_rate": 9.991991051623087e-05,
"loss": 1.1204,
"step": 2500
},
{
"epoch": 1.3015184381778742,
"grad_norm": 8215.1748046875,
"learning_rate": 9.988456131077249e-05,
"loss": 1.0925,
"step": 3000
},
{
"epoch": 1.5184381778741867,
"grad_norm": 15722.8212890625,
"learning_rate": 9.984277698186814e-05,
"loss": 1.0867,
"step": 3500
},
{
"epoch": 1.735357917570499,
"grad_norm": 17670.681640625,
"learning_rate": 9.979456291970887e-05,
"loss": 1.0714,
"step": 4000
},
{
"epoch": 1.9522776572668112,
"grad_norm": 15503.669921875,
"learning_rate": 9.974004102519452e-05,
"loss": 1.0605,
"step": 4500
},
{
"epoch": 2.0,
"eval_loss": 1.0418221950531006,
"eval_map": 0.3977,
"eval_map_50": 0.7371,
"eval_map_75": 0.389,
"eval_map_bus": 0.4529,
"eval_map_car": 0.4318,
"eval_map_container": 0.4316,
"eval_map_large": 0.6212,
"eval_map_medium": 0.3842,
"eval_map_motorbike": 0.2745,
"eval_map_small": 0.0841,
"eval_mar_1": 0.2265,
"eval_mar_10": 0.4923,
"eval_mar_100": 0.5393,
"eval_mar_100_bus": 0.6241,
"eval_mar_100_car": 0.5529,
"eval_mar_100_container": 0.5848,
"eval_mar_100_motorbike": 0.3954,
"eval_mar_large": 0.7101,
"eval_mar_medium": 0.5389,
"eval_mar_small": 0.2511,
"eval_runtime": 146.5587,
"eval_samples_per_second": 15.714,
"eval_steps_per_second": 1.965,
"step": 4610
},
{
"epoch": 2.1691973969631237,
"grad_norm": 3109.66162109375,
"learning_rate": 9.967899980939251e-05,
"loss": 1.0591,
"step": 5000
},
{
"epoch": 2.3861171366594363,
"grad_norm": 5812.068359375,
"learning_rate": 9.961154998764017e-05,
"loss": 1.0676,
"step": 5500
},
{
"epoch": 2.6030368763557483,
"grad_norm": 7711.87158203125,
"learning_rate": 9.953770026098485e-05,
"loss": 1.0673,
"step": 6000
},
{
"epoch": 2.819956616052061,
"grad_norm": 11271.8916015625,
"learning_rate": 9.945746015606358e-05,
"loss": 1.0634,
"step": 6500
},
{
"epoch": 3.0,
"eval_loss": 1.0088645219802856,
"eval_map": 0.4231,
"eval_map_50": 0.758,
"eval_map_75": 0.4223,
"eval_map_bus": 0.4788,
"eval_map_car": 0.4565,
"eval_map_container": 0.4648,
"eval_map_large": 0.658,
"eval_map_medium": 0.4084,
"eval_map_motorbike": 0.2923,
"eval_map_small": 0.09,
"eval_mar_1": 0.2352,
"eval_mar_10": 0.5048,
"eval_mar_100": 0.555,
"eval_mar_100_bus": 0.6323,
"eval_mar_100_car": 0.5672,
"eval_mar_100_container": 0.6028,
"eval_mar_100_motorbike": 0.4178,
"eval_mar_large": 0.7546,
"eval_mar_medium": 0.5521,
"eval_mar_small": 0.2802,
"eval_runtime": 147.4693,
"eval_samples_per_second": 15.617,
"eval_steps_per_second": 1.953,
"step": 6915
},
{
"epoch": 3.036876355748373,
"grad_norm": 20180.71484375,
"learning_rate": 9.937084002387407e-05,
"loss": 1.0418,
"step": 7000
},
{
"epoch": 3.2537960954446854,
"grad_norm": 11818.376953125,
"learning_rate": 9.927804336468942e-05,
"loss": 1.0386,
"step": 7500
},
{
"epoch": 3.470715835140998,
"grad_norm": 9070.5185546875,
"learning_rate": 9.917871022281522e-05,
"loss": 1.0635,
"step": 8000
},
{
"epoch": 3.6876355748373104,
"grad_norm": 7446.32666015625,
"learning_rate": 9.907303301249819e-05,
"loss": 1.0466,
"step": 8500
},
{
"epoch": 3.9045553145336225,
"grad_norm": 2428.818603515625,
"learning_rate": 9.896102536613032e-05,
"loss": 1.0288,
"step": 9000
},
{
"epoch": 4.0,
"eval_loss": 1.002821922302246,
"eval_map": 0.4297,
"eval_map_50": 0.7647,
"eval_map_75": 0.429,
"eval_map_bus": 0.4925,
"eval_map_car": 0.4582,
"eval_map_container": 0.4685,
"eval_map_large": 0.6667,
"eval_map_medium": 0.4184,
"eval_map_motorbike": 0.2997,
"eval_map_small": 0.0816,
"eval_mar_1": 0.2383,
"eval_mar_10": 0.5069,
"eval_mar_100": 0.5549,
"eval_mar_100_bus": 0.634,
"eval_mar_100_car": 0.5649,
"eval_mar_100_container": 0.5965,
"eval_mar_100_motorbike": 0.4243,
"eval_mar_large": 0.7579,
"eval_mar_medium": 0.5516,
"eval_mar_small": 0.2596,
"eval_runtime": 146.3143,
"eval_samples_per_second": 15.74,
"eval_steps_per_second": 1.968,
"step": 9220
},
{
"epoch": 4.1214750542299345,
"grad_norm": 4431.853515625,
"learning_rate": 9.88429446733437e-05,
"loss": 1.0289,
"step": 9500
},
{
"epoch": 4.3383947939262475,
"grad_norm": 16948.7890625,
"learning_rate": 9.871833290237144e-05,
"loss": 1.031,
"step": 10000
},
{
"epoch": 4.55531453362256,
"grad_norm": 5605.24951171875,
"learning_rate": 9.858743645176947e-05,
"loss": 1.0303,
"step": 10500
},
{
"epoch": 4.7722342733188725,
"grad_norm": 16235.091796875,
"learning_rate": 9.845027220721935e-05,
"loss": 1.0206,
"step": 11000
},
{
"epoch": 4.989154013015185,
"grad_norm": 20350.36328125,
"learning_rate": 9.830685786294999e-05,
"loss": 1.0226,
"step": 11500
},
{
"epoch": 5.0,
"eval_loss": 0.9774508476257324,
"eval_map": 0.4366,
"eval_map_50": 0.7785,
"eval_map_75": 0.4388,
"eval_map_bus": 0.5023,
"eval_map_car": 0.4658,
"eval_map_container": 0.4766,
"eval_map_large": 0.6605,
"eval_map_medium": 0.4243,
"eval_map_motorbike": 0.3015,
"eval_map_small": 0.0942,
"eval_mar_1": 0.2402,
"eval_mar_10": 0.5173,
"eval_mar_100": 0.5666,
"eval_mar_100_bus": 0.6534,
"eval_mar_100_car": 0.5747,
"eval_mar_100_container": 0.6145,
"eval_mar_100_motorbike": 0.4239,
"eval_mar_large": 0.751,
"eval_mar_medium": 0.5659,
"eval_mar_small": 0.2757,
"eval_runtime": 146.1171,
"eval_samples_per_second": 15.761,
"eval_steps_per_second": 1.971,
"step": 11525
},
{
"epoch": 5.206073752711497,
"grad_norm": 11680.388671875,
"learning_rate": 9.815721191945502e-05,
"loss": 1.0021,
"step": 12000
},
{
"epoch": 5.422993492407809,
"grad_norm": 6468.74072265625,
"learning_rate": 9.800167158422275e-05,
"loss": 1.0049,
"step": 12500
},
{
"epoch": 5.639913232104122,
"grad_norm": 10755.380859375,
"learning_rate": 9.78396335205612e-05,
"loss": 1.016,
"step": 13000
},
{
"epoch": 5.856832971800434,
"grad_norm": 6588.42578125,
"learning_rate": 9.767142412975505e-05,
"loss": 1.022,
"step": 13500
},
{
"epoch": 6.0,
"eval_loss": 0.9850358366966248,
"eval_map": 0.4356,
"eval_map_50": 0.7775,
"eval_map_75": 0.4345,
"eval_map_bus": 0.5032,
"eval_map_car": 0.455,
"eval_map_container": 0.4783,
"eval_map_large": 0.661,
"eval_map_medium": 0.4213,
"eval_map_motorbike": 0.3059,
"eval_map_small": 0.106,
"eval_mar_1": 0.2402,
"eval_mar_10": 0.514,
"eval_mar_100": 0.563,
"eval_mar_100_bus": 0.651,
"eval_mar_100_car": 0.5596,
"eval_mar_100_container": 0.6163,
"eval_mar_100_motorbike": 0.4251,
"eval_mar_large": 0.7479,
"eval_mar_medium": 0.5634,
"eval_mar_small": 0.2541,
"eval_runtime": 145.7736,
"eval_samples_per_second": 15.798,
"eval_steps_per_second": 1.976,
"step": 13830
},
{
"epoch": 6.073752711496746,
"grad_norm": 8365.4345703125,
"learning_rate": 9.749706511086642e-05,
"loss": 1.0065,
"step": 14000
},
{
"epoch": 6.290672451193059,
"grad_norm": 7092.89306640625,
"learning_rate": 9.731694602810796e-05,
"loss": 1.0004,
"step": 14500
},
{
"epoch": 6.507592190889371,
"grad_norm": 7779.22314453125,
"learning_rate": 9.713036820450053e-05,
"loss": 1.0193,
"step": 15000
},
{
"epoch": 6.724511930585683,
"grad_norm": 5161.82958984375,
"learning_rate": 9.693771054918806e-05,
"loss": 0.9992,
"step": 15500
},
{
"epoch": 6.941431670281996,
"grad_norm": 5342.78662109375,
"learning_rate": 9.673899791506617e-05,
"loss": 0.9936,
"step": 16000
},
{
"epoch": 7.0,
"eval_loss": 0.9677829742431641,
"eval_map": 0.4394,
"eval_map_50": 0.781,
"eval_map_75": 0.4415,
"eval_map_bus": 0.5059,
"eval_map_car": 0.4716,
"eval_map_container": 0.4731,
"eval_map_large": 0.6636,
"eval_map_medium": 0.4308,
"eval_map_motorbike": 0.307,
"eval_map_small": 0.109,
"eval_mar_1": 0.2401,
"eval_mar_10": 0.5184,
"eval_mar_100": 0.5674,
"eval_mar_100_bus": 0.6546,
"eval_mar_100_car": 0.5736,
"eval_mar_100_container": 0.6126,
"eval_mar_100_motorbike": 0.4289,
"eval_mar_large": 0.7468,
"eval_mar_medium": 0.5696,
"eval_mar_small": 0.2775,
"eval_runtime": 147.1057,
"eval_samples_per_second": 15.655,
"eval_steps_per_second": 1.958,
"step": 16135
},
{
"epoch": 7.158351409978308,
"grad_norm": 17945.982421875,
"learning_rate": 9.653425593612456e-05,
"loss": 0.9817,
"step": 16500
},
{
"epoch": 7.375271149674621,
"grad_norm": 2631.81591796875,
"learning_rate": 9.632393848695017e-05,
"loss": 0.9845,
"step": 17000
},
{
"epoch": 7.592190889370933,
"grad_norm": 1825.7994384765625,
"learning_rate": 9.61072297519293e-05,
"loss": 0.9839,
"step": 17500
},
{
"epoch": 7.809110629067245,
"grad_norm": 8929.837890625,
"learning_rate": 9.588457317037219e-05,
"loss": 0.9908,
"step": 18000
},
{
"epoch": 8.0,
"eval_loss": 0.9544239640235901,
"eval_map": 0.4515,
"eval_map_50": 0.7929,
"eval_map_75": 0.459,
"eval_map_bus": 0.5215,
"eval_map_car": 0.4759,
"eval_map_container": 0.4956,
"eval_map_large": 0.6707,
"eval_map_medium": 0.4407,
"eval_map_motorbike": 0.3131,
"eval_map_small": 0.103,
"eval_mar_1": 0.2439,
"eval_mar_10": 0.5243,
"eval_mar_100": 0.573,
"eval_mar_100_bus": 0.6558,
"eval_mar_100_car": 0.579,
"eval_mar_100_container": 0.6217,
"eval_mar_100_motorbike": 0.4355,
"eval_mar_large": 0.7575,
"eval_mar_medium": 0.5708,
"eval_mar_small": 0.3107,
"eval_runtime": 147.1314,
"eval_samples_per_second": 15.653,
"eval_steps_per_second": 1.957,
"step": 18440
},
{
"epoch": 8.026030368763557,
"grad_norm": 9851.580078125,
"learning_rate": 9.565599746504495e-05,
"loss": 0.9914,
"step": 18500
},
{
"epoch": 8.242950108459869,
"grad_norm": 46131.0703125,
"learning_rate": 9.542153212228251e-05,
"loss": 0.9789,
"step": 19000
},
{
"epoch": 8.459869848156183,
"grad_norm": 40477.8671875,
"learning_rate": 9.518120738818473e-05,
"loss": 0.9642,
"step": 19500
},
{
"epoch": 8.676789587852495,
"grad_norm": 21795.466796875,
"learning_rate": 9.493505426471479e-05,
"loss": 0.9637,
"step": 20000
},
{
"epoch": 8.893709327548807,
"grad_norm": 5294.40673828125,
"learning_rate": 9.468361416878137e-05,
"loss": 0.9853,
"step": 20500
},
{
"epoch": 9.0,
"eval_loss": 0.9467804431915283,
"eval_map": 0.4529,
"eval_map_50": 0.7951,
"eval_map_75": 0.46,
"eval_map_bus": 0.5273,
"eval_map_car": 0.4728,
"eval_map_container": 0.4969,
"eval_map_large": 0.6735,
"eval_map_medium": 0.4421,
"eval_map_motorbike": 0.3144,
"eval_map_small": 0.1016,
"eval_mar_1": 0.2466,
"eval_mar_10": 0.5271,
"eval_mar_100": 0.5772,
"eval_mar_100_bus": 0.6592,
"eval_mar_100_car": 0.5831,
"eval_mar_100_container": 0.6281,
"eval_mar_100_motorbike": 0.4385,
"eval_mar_large": 0.7607,
"eval_mar_medium": 0.5767,
"eval_mar_small": 0.2947,
"eval_runtime": 146.7224,
"eval_samples_per_second": 15.696,
"eval_steps_per_second": 1.963,
"step": 20745
},
{
"epoch": 9.11062906724512,
"grad_norm": 20100.53515625,
"learning_rate": 9.442591177115253e-05,
"loss": 0.973,
"step": 21000
},
{
"epoch": 9.327548806941431,
"grad_norm": 4432.14404296875,
"learning_rate": 9.416247841751377e-05,
"loss": 0.9844,
"step": 21500
},
{
"epoch": 9.544468546637743,
"grad_norm": 5448.53369140625,
"learning_rate": 9.389334809084711e-05,
"loss": 0.9783,
"step": 22000
},
{
"epoch": 9.761388286334057,
"grad_norm": 18744.869140625,
"learning_rate": 9.361855550904582e-05,
"loss": 0.9591,
"step": 22500
},
{
"epoch": 9.97830802603037,
"grad_norm": 9256.87890625,
"learning_rate": 9.333870255084278e-05,
"loss": 0.9536,
"step": 23000
},
{
"epoch": 10.0,
"eval_loss": 0.9346117377281189,
"eval_map": 0.4603,
"eval_map_50": 0.8028,
"eval_map_75": 0.4763,
"eval_map_bus": 0.5317,
"eval_map_car": 0.4808,
"eval_map_container": 0.5064,
"eval_map_large": 0.6826,
"eval_map_medium": 0.4525,
"eval_map_motorbike": 0.3221,
"eval_map_small": 0.108,
"eval_mar_1": 0.2479,
"eval_mar_10": 0.532,
"eval_mar_100": 0.5823,
"eval_mar_100_bus": 0.6637,
"eval_mar_100_car": 0.591,
"eval_mar_100_container": 0.6308,
"eval_mar_100_motorbike": 0.4437,
"eval_mar_large": 0.7735,
"eval_mar_medium": 0.5844,
"eval_mar_small": 0.2885,
"eval_runtime": 144.7391,
"eval_samples_per_second": 15.911,
"eval_steps_per_second": 1.99,
"step": 23050
},
{
"epoch": 10.195227765726681,
"grad_norm": 6654.49365234375,
"learning_rate": 9.30532812271677e-05,
"loss": 0.9821,
"step": 23500
},
{
"epoch": 10.412147505422993,
"grad_norm": 12540.853515625,
"learning_rate": 9.276173960919273e-05,
"loss": 0.9966,
"step": 24000
},
{
"epoch": 10.629067245119305,
"grad_norm": 8583.029296875,
"learning_rate": 9.246468171391835e-05,
"loss": 0.9826,
"step": 24500
},
{
"epoch": 10.845986984815617,
"grad_norm": 5945.16796875,
"learning_rate": 9.216214586190261e-05,
"loss": 0.9769,
"step": 25000
},
{
"epoch": 11.0,
"eval_loss": 0.9336058497428894,
"eval_map": 0.4511,
"eval_map_50": 0.8,
"eval_map_75": 0.4575,
"eval_map_bus": 0.5073,
"eval_map_car": 0.4708,
"eval_map_container": 0.5006,
"eval_map_large": 0.6611,
"eval_map_medium": 0.4469,
"eval_map_motorbike": 0.3259,
"eval_map_small": 0.1072,
"eval_mar_1": 0.2412,
"eval_mar_10": 0.5266,
"eval_mar_100": 0.5752,
"eval_mar_100_bus": 0.6493,
"eval_mar_100_car": 0.5772,
"eval_mar_100_container": 0.6233,
"eval_mar_100_motorbike": 0.4511,
"eval_mar_large": 0.7508,
"eval_mar_medium": 0.5789,
"eval_mar_small": 0.2908,
"eval_runtime": 147.6126,
"eval_samples_per_second": 15.602,
"eval_steps_per_second": 1.951,
"step": 25355
},
{
"epoch": 11.062906724511931,
"grad_norm": 10052.8896484375,
"learning_rate": 9.185417108036163e-05,
"loss": 0.9731,
"step": 25500
},
{
"epoch": 11.279826464208243,
"grad_norm": 3725.647216796875,
"learning_rate": 9.154079709813505e-05,
"loss": 0.9572,
"step": 26000
},
{
"epoch": 11.496746203904555,
"grad_norm": 10829.8896484375,
"learning_rate": 9.122206434056104e-05,
"loss": 0.9558,
"step": 26500
},
{
"epoch": 11.713665943600867,
"grad_norm": 16212.732421875,
"learning_rate": 9.08980139242614e-05,
"loss": 0.9622,
"step": 27000
},
{
"epoch": 11.93058568329718,
"grad_norm": 12326.623046875,
"learning_rate": 9.056868765183752e-05,
"loss": 0.9506,
"step": 27500
},
{
"epoch": 12.0,
"eval_loss": 0.9213413596153259,
"eval_map": 0.4617,
"eval_map_50": 0.8095,
"eval_map_75": 0.4735,
"eval_map_bus": 0.5252,
"eval_map_car": 0.4891,
"eval_map_container": 0.5052,
"eval_map_large": 0.676,
"eval_map_medium": 0.455,
"eval_map_motorbike": 0.3272,
"eval_map_small": 0.1083,
"eval_mar_1": 0.2461,
"eval_mar_10": 0.5327,
"eval_mar_100": 0.5818,
"eval_mar_100_bus": 0.6626,
"eval_mar_100_car": 0.5902,
"eval_mar_100_container": 0.627,
"eval_mar_100_motorbike": 0.4475,
"eval_mar_large": 0.7631,
"eval_mar_medium": 0.5838,
"eval_mar_small": 0.2935,
"eval_runtime": 143.9851,
"eval_samples_per_second": 15.995,
"eval_steps_per_second": 2.0,
"step": 27660
},
{
"epoch": 12.147505422993492,
"grad_norm": 23455.04296875,
"learning_rate": 9.023412800647782e-05,
"loss": 0.9338,
"step": 28000
},
{
"epoch": 12.364425162689805,
"grad_norm": 7761.9912109375,
"learning_rate": 8.989506279701155e-05,
"loss": 0.9535,
"step": 28500
},
{
"epoch": 12.581344902386117,
"grad_norm": 7034.04052734375,
"learning_rate": 8.955017679879593e-05,
"loss": 0.9507,
"step": 29000
},
{
"epoch": 12.79826464208243,
"grad_norm": 5548.38525390625,
"learning_rate": 8.920018881585156e-05,
"loss": 0.9417,
"step": 29500
},
{
"epoch": 13.0,
"eval_loss": 0.9276334643363953,
"eval_map": 0.4608,
"eval_map_50": 0.8076,
"eval_map_75": 0.4687,
"eval_map_bus": 0.5336,
"eval_map_car": 0.4866,
"eval_map_container": 0.4992,
"eval_map_large": 0.6724,
"eval_map_medium": 0.4511,
"eval_map_motorbike": 0.3238,
"eval_map_small": 0.1064,
"eval_mar_1": 0.2472,
"eval_mar_10": 0.5288,
"eval_mar_100": 0.5752,
"eval_mar_100_bus": 0.6588,
"eval_mar_100_car": 0.5895,
"eval_mar_100_container": 0.6158,
"eval_mar_100_motorbike": 0.4369,
"eval_mar_large": 0.7512,
"eval_mar_medium": 0.5708,
"eval_mar_small": 0.2981,
"eval_runtime": 145.1236,
"eval_samples_per_second": 15.869,
"eval_steps_per_second": 1.985,
"step": 29965
},
{
"epoch": 13.015184381778742,
"grad_norm": 12253.849609375,
"learning_rate": 8.884514399673369e-05,
"loss": 0.9555,
"step": 30000
},
{
"epoch": 13.232104121475054,
"grad_norm": 13796.53125,
"learning_rate": 8.848508814233106e-05,
"loss": 0.9476,
"step": 30500
},
{
"epoch": 13.449023861171366,
"grad_norm": 5713.0361328125,
"learning_rate": 8.812080266430921e-05,
"loss": 0.9417,
"step": 31000
},
{
"epoch": 13.66594360086768,
"grad_norm": 3508.00634765625,
"learning_rate": 8.77508745092958e-05,
"loss": 0.9446,
"step": 31500
},
{
"epoch": 13.882863340563992,
"grad_norm": 4413.595703125,
"learning_rate": 8.737607648009131e-05,
"loss": 0.9488,
"step": 32000
},
{
"epoch": 14.0,
"eval_loss": 0.9241105318069458,
"eval_map": 0.4602,
"eval_map_50": 0.8064,
"eval_map_75": 0.4696,
"eval_map_bus": 0.5309,
"eval_map_car": 0.4761,
"eval_map_container": 0.5062,
"eval_map_large": 0.6817,
"eval_map_medium": 0.4503,
"eval_map_motorbike": 0.3275,
"eval_map_small": 0.1122,
"eval_mar_1": 0.2462,
"eval_mar_10": 0.5333,
"eval_mar_100": 0.5819,
"eval_mar_100_bus": 0.6633,
"eval_mar_100_car": 0.5828,
"eval_mar_100_container": 0.6259,
"eval_mar_100_motorbike": 0.4557,
"eval_mar_large": 0.7655,
"eval_mar_medium": 0.5804,
"eval_mar_small": 0.2896,
"eval_runtime": 145.7229,
"eval_samples_per_second": 15.804,
"eval_steps_per_second": 1.976,
"step": 32270
},
{
"epoch": 14.099783080260304,
"grad_norm": 7677.90478515625,
"learning_rate": 8.699645692575454e-05,
"loss": 0.9519,
"step": 32500
},
{
"epoch": 14.316702819956616,
"grad_norm": 4366.18212890625,
"learning_rate": 8.661283833169138e-05,
"loss": 0.9471,
"step": 33000
},
{
"epoch": 14.533622559652928,
"grad_norm": 5411.373046875,
"learning_rate": 8.622373265190294e-05,
"loss": 0.9423,
"step": 33500
},
{
"epoch": 14.750542299349242,
"grad_norm": 7791.236328125,
"learning_rate": 8.582995409968335e-05,
"loss": 0.9357,
"step": 34000
},
{
"epoch": 14.967462039045554,
"grad_norm": 20878.41796875,
"learning_rate": 8.543155347258457e-05,
"loss": 0.9371,
"step": 34500
},
{
"epoch": 15.0,
"eval_loss": 0.9158653020858765,
"eval_map": 0.4646,
"eval_map_50": 0.8109,
"eval_map_75": 0.479,
"eval_map_bus": 0.525,
"eval_map_car": 0.4942,
"eval_map_container": 0.5118,
"eval_map_large": 0.6799,
"eval_map_medium": 0.4567,
"eval_map_motorbike": 0.3276,
"eval_map_small": 0.1141,
"eval_mar_1": 0.2484,
"eval_mar_10": 0.533,
"eval_mar_100": 0.5795,
"eval_mar_100_bus": 0.6523,
"eval_mar_100_car": 0.5909,
"eval_mar_100_container": 0.6278,
"eval_mar_100_motorbike": 0.447,
"eval_mar_large": 0.7745,
"eval_mar_medium": 0.5767,
"eval_mar_small": 0.3179,
"eval_runtime": 143.8949,
"eval_samples_per_second": 16.005,
"eval_steps_per_second": 2.001,
"step": 34575
},
{
"epoch": 15.184381778741866,
"grad_norm": 8804.869140625,
"learning_rate": 8.502858216440758e-05,
"loss": 0.9249,
"step": 35000
},
{
"epoch": 15.401301518438178,
"grad_norm": 7941.79443359375,
"learning_rate": 8.462191161340177e-05,
"loss": 0.9341,
"step": 35500
},
{
"epoch": 15.61822125813449,
"grad_norm": 11279.1513671875,
"learning_rate": 8.420996435565979e-05,
"loss": 0.9342,
"step": 36000
},
{
"epoch": 15.835140997830802,
"grad_norm": 2519.469970703125,
"learning_rate": 8.379360400220391e-05,
"loss": 0.9311,
"step": 36500
},
{
"epoch": 16.0,
"eval_loss": 0.8999801278114319,
"eval_map": 0.4741,
"eval_map_50": 0.8169,
"eval_map_75": 0.4893,
"eval_map_bus": 0.5392,
"eval_map_car": 0.5006,
"eval_map_container": 0.5198,
"eval_map_large": 0.6914,
"eval_map_medium": 0.4673,
"eval_map_motorbike": 0.3368,
"eval_map_small": 0.1224,
"eval_mar_1": 0.2523,
"eval_mar_10": 0.544,
"eval_mar_100": 0.5909,
"eval_mar_100_bus": 0.6792,
"eval_mar_100_car": 0.5917,
"eval_mar_100_container": 0.6356,
"eval_mar_100_motorbike": 0.4571,
"eval_mar_large": 0.7817,
"eval_mar_medium": 0.593,
"eval_mar_small": 0.3192,
"eval_runtime": 144.4917,
"eval_samples_per_second": 15.939,
"eval_steps_per_second": 1.993,
"step": 36880
},
{
"epoch": 16.052060737527114,
"grad_norm": 6870.65673828125,
"learning_rate": 8.337288426364522e-05,
"loss": 0.9394,
"step": 37000
},
{
"epoch": 16.268980477223426,
"grad_norm": 18748.70703125,
"learning_rate": 8.294785941295685e-05,
"loss": 0.9206,
"step": 37500
},
{
"epoch": 16.485900216919738,
"grad_norm": 8770.451171875,
"learning_rate": 8.251944703380834e-05,
"loss": 0.9277,
"step": 38000
},
{
"epoch": 16.702819956616054,
"grad_norm": 10527.71484375,
"learning_rate": 8.208598532633761e-05,
"loss": 0.9363,
"step": 38500
},
{
"epoch": 16.919739696312366,
"grad_norm": 13457.677734375,
"learning_rate": 8.164838451708801e-05,
"loss": 0.9284,
"step": 39000
},
{
"epoch": 17.0,
"eval_loss": 0.9076481461524963,
"eval_map": 0.472,
"eval_map_50": 0.8148,
"eval_map_75": 0.4845,
"eval_map_bus": 0.5397,
"eval_map_car": 0.4969,
"eval_map_container": 0.5162,
"eval_map_large": 0.684,
"eval_map_medium": 0.4625,
"eval_map_motorbike": 0.3354,
"eval_map_small": 0.1174,
"eval_mar_1": 0.252,
"eval_mar_10": 0.5415,
"eval_mar_100": 0.5905,
"eval_mar_100_bus": 0.6732,
"eval_mar_100_car": 0.5938,
"eval_mar_100_container": 0.6354,
"eval_mar_100_motorbike": 0.4596,
"eval_mar_large": 0.767,
"eval_mar_medium": 0.5905,
"eval_mar_small": 0.315,
"eval_runtime": 145.0152,
"eval_samples_per_second": 15.881,
"eval_steps_per_second": 1.986,
"step": 39185
},
{
"epoch": 17.136659436008678,
"grad_norm": 6826.60595703125,
"learning_rate": 8.120670105669583e-05,
"loss": 0.9237,
"step": 39500
},
{
"epoch": 17.35357917570499,
"grad_norm": 10753.5400390625,
"learning_rate": 8.076099192246061e-05,
"loss": 0.9257,
"step": 40000
},
{
"epoch": 17.570498915401302,
"grad_norm": 5758.92919921875,
"learning_rate": 8.031131461099501e-05,
"loss": 0.9247,
"step": 40500
},
{
"epoch": 17.787418655097614,
"grad_norm": 11779.173828125,
"learning_rate": 7.985772713080777e-05,
"loss": 0.9107,
"step": 41000
},
{
"epoch": 18.0,
"eval_loss": 0.9001684188842773,
"eval_map": 0.4753,
"eval_map_50": 0.8198,
"eval_map_75": 0.4952,
"eval_map_bus": 0.5451,
"eval_map_car": 0.501,
"eval_map_container": 0.5198,
"eval_map_large": 0.6944,
"eval_map_medium": 0.4679,
"eval_map_motorbike": 0.3352,
"eval_map_small": 0.1207,
"eval_mar_1": 0.2516,
"eval_mar_10": 0.5428,
"eval_mar_100": 0.5902,
"eval_mar_100_bus": 0.6716,
"eval_mar_100_car": 0.5977,
"eval_mar_100_container": 0.6353,
"eval_mar_100_motorbike": 0.4562,
"eval_mar_large": 0.7743,
"eval_mar_medium": 0.592,
"eval_mar_small": 0.3133,
"eval_runtime": 143.7248,
"eval_samples_per_second": 16.024,
"eval_steps_per_second": 2.004,
"step": 41490
},
{
"epoch": 18.004338394793926,
"grad_norm": 3542.92626953125,
"learning_rate": 7.940120667790506e-05,
"loss": 0.919,
"step": 41500
},
{
"epoch": 18.22125813449024,
"grad_norm": 22165.880859375,
"learning_rate": 7.893998242197806e-05,
"loss": 0.928,
"step": 42000
},
{
"epoch": 18.43817787418655,
"grad_norm": 3429.292236328125,
"learning_rate": 7.84750248995952e-05,
"loss": 0.9192,
"step": 42500
},
{
"epoch": 18.655097613882862,
"grad_norm": 10154.87109375,
"learning_rate": 7.800639409041694e-05,
"loss": 0.9183,
"step": 43000
},
{
"epoch": 18.872017353579174,
"grad_norm": 25265.55078125,
"learning_rate": 7.753415044795898e-05,
"loss": 0.9125,
"step": 43500
},
{
"epoch": 19.0,
"eval_loss": 0.8902826905250549,
"eval_map": 0.4805,
"eval_map_50": 0.8223,
"eval_map_75": 0.5006,
"eval_map_bus": 0.5537,
"eval_map_car": 0.5047,
"eval_map_container": 0.5198,
"eval_map_large": 0.6876,
"eval_map_medium": 0.4736,
"eval_map_motorbike": 0.3438,
"eval_map_small": 0.119,
"eval_mar_1": 0.2528,
"eval_mar_10": 0.5449,
"eval_mar_100": 0.5921,
"eval_mar_100_bus": 0.6688,
"eval_mar_100_car": 0.6008,
"eval_mar_100_container": 0.6319,
"eval_mar_100_motorbike": 0.4669,
"eval_mar_large": 0.7716,
"eval_mar_medium": 0.5905,
"eval_mar_small": 0.3164,
"eval_runtime": 146.715,
"eval_samples_per_second": 15.697,
"eval_steps_per_second": 1.963,
"step": 43795
},
{
"epoch": 19.088937093275486,
"grad_norm": 7347.31640625,
"learning_rate": 7.705835489179352e-05,
"loss": 0.9033,
"step": 44000
},
{
"epoch": 19.305856832971802,
"grad_norm": 5815.42822265625,
"learning_rate": 7.658003081440886e-05,
"loss": 0.9049,
"step": 44500
},
{
"epoch": 19.522776572668114,
"grad_norm": 5560.4921875,
"learning_rate": 7.609732280983515e-05,
"loss": 0.9124,
"step": 45000
},
{
"epoch": 19.739696312364426,
"grad_norm": 5130.99462890625,
"learning_rate": 7.56112482427524e-05,
"loss": 0.9205,
"step": 45500
},
{
"epoch": 19.95661605206074,
"grad_norm": 17505.642578125,
"learning_rate": 7.512186981692624e-05,
"loss": 0.913,
"step": 46000
},
{
"epoch": 20.0,
"eval_loss": 0.8936046957969666,
"eval_map": 0.4822,
"eval_map_50": 0.8243,
"eval_map_75": 0.504,
"eval_map_bus": 0.5592,
"eval_map_car": 0.4984,
"eval_map_container": 0.5236,
"eval_map_large": 0.6904,
"eval_map_medium": 0.4777,
"eval_map_motorbike": 0.3475,
"eval_map_small": 0.115,
"eval_mar_1": 0.2536,
"eval_mar_10": 0.5453,
"eval_mar_100": 0.5923,
"eval_mar_100_bus": 0.6727,
"eval_mar_100_car": 0.5953,
"eval_mar_100_container": 0.6347,
"eval_mar_100_motorbike": 0.4666,
"eval_mar_large": 0.7683,
"eval_mar_medium": 0.5946,
"eval_mar_small": 0.3124,
"eval_runtime": 146.1172,
"eval_samples_per_second": 15.761,
"eval_steps_per_second": 1.971,
"step": 46100
},
{
"epoch": 20.17353579175705,
"grad_norm": 21176.666015625,
"learning_rate": 7.462925066232113e-05,
"loss": 0.9039,
"step": 46500
},
{
"epoch": 20.390455531453362,
"grad_norm": 4085.164306640625,
"learning_rate": 7.413444904801033e-05,
"loss": 0.9082,
"step": 47000
},
{
"epoch": 20.607375271149674,
"grad_norm": 20771.896484375,
"learning_rate": 7.363554565211042e-05,
"loss": 0.9087,
"step": 47500
},
{
"epoch": 20.824295010845987,
"grad_norm": 5990.69580078125,
"learning_rate": 7.313359326369684e-05,
"loss": 0.908,
"step": 48000
},
{
"epoch": 21.0,
"eval_loss": 0.8810420036315918,
"eval_map": 0.483,
"eval_map_50": 0.8249,
"eval_map_75": 0.5047,
"eval_map_bus": 0.5531,
"eval_map_car": 0.5081,
"eval_map_container": 0.5229,
"eval_map_large": 0.7091,
"eval_map_medium": 0.4743,
"eval_map_motorbike": 0.348,
"eval_map_small": 0.1233,
"eval_mar_1": 0.2539,
"eval_mar_10": 0.5486,
"eval_mar_100": 0.5987,
"eval_mar_100_bus": 0.6764,
"eval_mar_100_car": 0.6079,
"eval_mar_100_container": 0.6426,
"eval_mar_100_motorbike": 0.4679,
"eval_mar_large": 0.7947,
"eval_mar_medium": 0.5992,
"eval_mar_small": 0.3117,
"eval_runtime": 143.798,
"eval_samples_per_second": 16.016,
"eval_steps_per_second": 2.003,
"step": 48405
},
{
"epoch": 21.0412147505423,
"grad_norm": 4679.26220703125,
"learning_rate": 7.262865663477902e-05,
"loss": 0.9023,
"step": 48500
},
{
"epoch": 21.25813449023861,
"grad_norm": 18654.177734375,
"learning_rate": 7.21208009023343e-05,
"loss": 0.9069,
"step": 49000
},
{
"epoch": 21.475054229934923,
"grad_norm": 10939.3623046875,
"learning_rate": 7.161009157990521e-05,
"loss": 0.8956,
"step": 49500
},
{
"epoch": 21.691973969631235,
"grad_norm": 14381.9765625,
"learning_rate": 7.109659454914833e-05,
"loss": 0.8925,
"step": 50000
},
{
"epoch": 21.90889370932755,
"grad_norm": 5005.86865234375,
"learning_rate": 7.058141116015095e-05,
"loss": 0.8997,
"step": 50500
},
{
"epoch": 22.0,
"eval_loss": 0.8783358335494995,
"eval_map": 0.4846,
"eval_map_50": 0.8275,
"eval_map_75": 0.5024,
"eval_map_bus": 0.5507,
"eval_map_car": 0.5086,
"eval_map_container": 0.5299,
"eval_map_large": 0.699,
"eval_map_medium": 0.4761,
"eval_map_motorbike": 0.3491,
"eval_map_small": 0.1256,
"eval_mar_1": 0.2542,
"eval_mar_10": 0.5503,
"eval_mar_100": 0.5994,
"eval_mar_100_bus": 0.6731,
"eval_mar_100_car": 0.6068,
"eval_mar_100_container": 0.6486,
"eval_mar_100_motorbike": 0.469,
"eval_mar_large": 0.7854,
"eval_mar_medium": 0.5993,
"eval_mar_small": 0.3314,
"eval_runtime": 144.6256,
"eval_samples_per_second": 15.924,
"eval_steps_per_second": 1.991,
"step": 50710
},
{
"epoch": 22.125813449023862,
"grad_norm": 19755.140625,
"learning_rate": 7.006254303068497e-05,
"loss": 0.8975,
"step": 51000
},
{
"epoch": 22.342733188720175,
"grad_norm": 11582.6494140625,
"learning_rate": 6.954108682712056e-05,
"loss": 0.898,
"step": 51500
},
{
"epoch": 22.559652928416487,
"grad_norm": 6819.56396484375,
"learning_rate": 6.901710981746509e-05,
"loss": 0.8999,
"step": 52000
},
{
"epoch": 22.7765726681128,
"grad_norm": 7609.8115234375,
"learning_rate": 6.849067959491079e-05,
"loss": 0.8978,
"step": 52500
},
{
"epoch": 22.99349240780911,
"grad_norm": 10856.244140625,
"learning_rate": 6.796186406911505e-05,
"loss": 0.8865,
"step": 53000
},
{
"epoch": 23.0,
"eval_loss": 0.871816098690033,
"eval_map": 0.4901,
"eval_map_50": 0.8289,
"eval_map_75": 0.5202,
"eval_map_bus": 0.5591,
"eval_map_car": 0.5153,
"eval_map_container": 0.5306,
"eval_map_large": 0.7037,
"eval_map_medium": 0.4841,
"eval_map_motorbike": 0.3553,
"eval_map_small": 0.1243,
"eval_mar_1": 0.2558,
"eval_mar_10": 0.5526,
"eval_mar_100": 0.6008,
"eval_mar_100_bus": 0.6757,
"eval_mar_100_car": 0.6077,
"eval_mar_100_container": 0.6452,
"eval_mar_100_motorbike": 0.4746,
"eval_mar_large": 0.788,
"eval_mar_medium": 0.6019,
"eval_mar_small": 0.3201,
"eval_runtime": 145.8422,
"eval_samples_per_second": 15.791,
"eval_steps_per_second": 1.975,
"step": 53015
},
{
"epoch": 23.210412147505423,
"grad_norm": 6373.787109375,
"learning_rate": 6.743286051281191e-05,
"loss": 0.8974,
"step": 53500
},
{
"epoch": 23.427331887201735,
"grad_norm": 3711.38671875,
"learning_rate": 6.68994881889314e-05,
"loss": 0.9048,
"step": 54000
},
{
"epoch": 23.644251626898047,
"grad_norm": 1683.364501953125,
"learning_rate": 6.636393582598046e-05,
"loss": 0.911,
"step": 54500
},
{
"epoch": 23.86117136659436,
"grad_norm": 2381.84423828125,
"learning_rate": 6.582627251037533e-05,
"loss": 0.9052,
"step": 55000
},
{
"epoch": 24.0,
"eval_loss": 0.8951303958892822,
"eval_map": 0.4779,
"eval_map_50": 0.8254,
"eval_map_75": 0.4914,
"eval_map_bus": 0.5509,
"eval_map_car": 0.5002,
"eval_map_container": 0.5227,
"eval_map_large": 0.697,
"eval_map_medium": 0.469,
"eval_map_motorbike": 0.3376,
"eval_map_small": 0.1198,
"eval_mar_1": 0.2524,
"eval_mar_10": 0.5426,
"eval_mar_100": 0.5902,
"eval_mar_100_bus": 0.6715,
"eval_mar_100_car": 0.5914,
"eval_mar_100_container": 0.643,
"eval_mar_100_motorbike": 0.455,
"eval_mar_large": 0.7785,
"eval_mar_medium": 0.5885,
"eval_mar_small": 0.319,
"eval_runtime": 145.8551,
"eval_samples_per_second": 15.79,
"eval_steps_per_second": 1.975,
"step": 55320
},
{
"epoch": 24.07809110629067,
"grad_norm": 19113.990234375,
"learning_rate": 6.528656760084578e-05,
"loss": 0.9112,
"step": 55500
},
{
"epoch": 24.295010845986983,
"grad_norm": 20675.185546875,
"learning_rate": 6.474489071948787e-05,
"loss": 0.8944,
"step": 56000
},
{
"epoch": 24.5119305856833,
"grad_norm": 10454.0859375,
"learning_rate": 6.420131174278254e-05,
"loss": 0.8915,
"step": 56500
},
{
"epoch": 24.72885032537961,
"grad_norm": 4770.7431640625,
"learning_rate": 6.365590079258165e-05,
"loss": 0.8891,
"step": 57000
},
{
"epoch": 24.945770065075923,
"grad_norm": 16598.36328125,
"learning_rate": 6.310872822706217e-05,
"loss": 0.8982,
"step": 57500
},
{
"epoch": 25.0,
"eval_loss": 0.8864476084709167,
"eval_map": 0.4662,
"eval_map_50": 0.8105,
"eval_map_75": 0.4884,
"eval_map_bus": 0.515,
"eval_map_car": 0.4889,
"eval_map_container": 0.5084,
"eval_map_large": 0.6737,
"eval_map_medium": 0.4711,
"eval_map_motorbike": 0.3524,
"eval_map_small": 0.1286,
"eval_mar_1": 0.2482,
"eval_mar_10": 0.5444,
"eval_mar_100": 0.5934,
"eval_mar_100_bus": 0.6696,
"eval_mar_100_car": 0.5993,
"eval_mar_100_container": 0.6371,
"eval_mar_100_motorbike": 0.4675,
"eval_mar_large": 0.7729,
"eval_mar_medium": 0.5969,
"eval_mar_small": 0.3226,
"eval_runtime": 144.7854,
"eval_samples_per_second": 15.906,
"eval_steps_per_second": 1.989,
"step": 57625
},
{
"epoch": 25.162689804772235,
"grad_norm": 6422.17041015625,
"learning_rate": 6.25609639994632e-05,
"loss": 0.8784,
"step": 58000
},
{
"epoch": 25.379609544468547,
"grad_norm": 16689.212890625,
"learning_rate": 6.201048334737784e-05,
"loss": 0.8855,
"step": 58500
},
{
"epoch": 25.59652928416486,
"grad_norm": 18894.322265625,
"learning_rate": 6.145845333932029e-05,
"loss": 0.8872,
"step": 59000
},
{
"epoch": 25.81344902386117,
"grad_norm": 4359.09521484375,
"learning_rate": 6.090494518732801e-05,
"loss": 0.8835,
"step": 59500
},
{
"epoch": 26.0,
"eval_loss": 0.8596058487892151,
"eval_map": 0.4972,
"eval_map_50": 0.8376,
"eval_map_75": 0.5257,
"eval_map_bus": 0.5714,
"eval_map_car": 0.5186,
"eval_map_container": 0.5391,
"eval_map_large": 0.7028,
"eval_map_medium": 0.4915,
"eval_map_motorbike": 0.3598,
"eval_map_small": 0.1342,
"eval_mar_1": 0.2583,
"eval_mar_10": 0.5574,
"eval_mar_100": 0.6057,
"eval_mar_100_bus": 0.6883,
"eval_mar_100_car": 0.6094,
"eval_mar_100_container": 0.6514,
"eval_mar_100_motorbike": 0.4737,
"eval_mar_large": 0.7866,
"eval_mar_medium": 0.6078,
"eval_mar_small": 0.3419,
"eval_runtime": 145.0724,
"eval_samples_per_second": 15.875,
"eval_steps_per_second": 1.985,
"step": 59930
},
{
"epoch": 26.030368763557483,
"grad_norm": 28658.181640625,
"learning_rate": 6.0350030294119464e-05,
"loss": 0.8825,
"step": 60000
},
{
"epoch": 26.247288503253795,
"grad_norm": 6283.97509765625,
"learning_rate": 5.979489402880387e-05,
"loss": 0.8833,
"step": 60500
},
{
"epoch": 26.464208242950107,
"grad_norm": 4272.13037109375,
"learning_rate": 5.923738303304234e-05,
"loss": 0.8844,
"step": 61000
},
{
"epoch": 26.68112798264642,
"grad_norm": 14047.6572265625,
"learning_rate": 5.8678680412085076e-05,
"loss": 0.8785,
"step": 61500
},
{
"epoch": 26.89804772234273,
"grad_norm": 8514.8544921875,
"learning_rate": 5.811885823873863e-05,
"loss": 0.8692,
"step": 62000
},
{
"epoch": 27.0,
"eval_loss": 0.8606675863265991,
"eval_map": 0.4927,
"eval_map_50": 0.837,
"eval_map_75": 0.5186,
"eval_map_bus": 0.5641,
"eval_map_car": 0.5122,
"eval_map_container": 0.5369,
"eval_map_large": 0.7052,
"eval_map_medium": 0.4874,
"eval_map_motorbike": 0.3576,
"eval_map_small": 0.1426,
"eval_mar_1": 0.2578,
"eval_mar_10": 0.5566,
"eval_mar_100": 0.6043,
"eval_mar_100_bus": 0.6885,
"eval_mar_100_car": 0.6043,
"eval_mar_100_container": 0.6507,
"eval_mar_100_motorbike": 0.4737,
"eval_mar_large": 0.7936,
"eval_mar_medium": 0.608,
"eval_mar_small": 0.3251,
"eval_runtime": 145.9029,
"eval_samples_per_second": 15.784,
"eval_steps_per_second": 1.974,
"step": 62235
},
{
"epoch": 27.114967462039047,
"grad_norm": 17592.478515625,
"learning_rate": 5.755798873023209e-05,
"loss": 0.8719,
"step": 62500
},
{
"epoch": 27.33188720173536,
"grad_norm": 28705.041015625,
"learning_rate": 5.699614423890112e-05,
"loss": 0.873,
"step": 63000
},
{
"epoch": 27.54880694143167,
"grad_norm": 14412.8916015625,
"learning_rate": 5.643339724285447e-05,
"loss": 0.8654,
"step": 63500
},
{
"epoch": 27.765726681127983,
"grad_norm": 11298.9375,
"learning_rate": 5.587094827038153e-05,
"loss": 0.8829,
"step": 64000
},
{
"epoch": 27.982646420824295,
"grad_norm": 8732.7822265625,
"learning_rate": 5.530661559735304e-05,
"loss": 0.8694,
"step": 64500
},
{
"epoch": 28.0,
"eval_loss": 0.8637914657592773,
"eval_map": 0.4929,
"eval_map_50": 0.8355,
"eval_map_75": 0.5204,
"eval_map_bus": 0.5621,
"eval_map_car": 0.5152,
"eval_map_container": 0.5343,
"eval_map_large": 0.7119,
"eval_map_medium": 0.4885,
"eval_map_motorbike": 0.3601,
"eval_map_small": 0.1308,
"eval_mar_1": 0.2571,
"eval_mar_10": 0.556,
"eval_mar_100": 0.6029,
"eval_mar_100_bus": 0.6851,
"eval_mar_100_car": 0.6085,
"eval_mar_100_container": 0.6431,
"eval_mar_100_motorbike": 0.4749,
"eval_mar_large": 0.7964,
"eval_mar_medium": 0.6042,
"eval_mar_small": 0.3162,
"eval_runtime": 145.47,
"eval_samples_per_second": 15.831,
"eval_steps_per_second": 1.98,
"step": 64540
},
{
"epoch": 28.199566160520607,
"grad_norm": 6033.21923828125,
"learning_rate": 5.474159836931288e-05,
"loss": 0.8805,
"step": 65000
},
{
"epoch": 28.41648590021692,
"grad_norm": 7858.236328125,
"learning_rate": 5.417596947365383e-05,
"loss": 0.878,
"step": 65500
},
{
"epoch": 28.63340563991323,
"grad_norm": 11765.7236328125,
"learning_rate": 5.361093470095784e-05,
"loss": 0.8746,
"step": 66000
},
{
"epoch": 28.850325379609544,
"grad_norm": 3453.400146484375,
"learning_rate": 5.304430229684755e-05,
"loss": 0.8744,
"step": 66500
},
{
"epoch": 29.0,
"eval_loss": 0.8675053119659424,
"eval_map": 0.4883,
"eval_map_50": 0.8358,
"eval_map_75": 0.5122,
"eval_map_bus": 0.5564,
"eval_map_car": 0.5131,
"eval_map_container": 0.5244,
"eval_map_large": 0.6955,
"eval_map_medium": 0.4818,
"eval_map_motorbike": 0.3594,
"eval_map_small": 0.1305,
"eval_mar_1": 0.2542,
"eval_mar_10": 0.5483,
"eval_mar_100": 0.5948,
"eval_mar_100_bus": 0.6693,
"eval_mar_100_car": 0.602,
"eval_mar_100_container": 0.6352,
"eval_mar_100_motorbike": 0.4727,
"eval_mar_large": 0.7802,
"eval_mar_medium": 0.5936,
"eval_mar_small": 0.3363,
"eval_runtime": 145.2093,
"eval_samples_per_second": 15.86,
"eval_steps_per_second": 1.983,
"step": 66845
},
{
"epoch": 29.067245119305856,
"grad_norm": 4124.80615234375,
"learning_rate": 5.24772771768233e-05,
"loss": 0.8763,
"step": 67000
},
{
"epoch": 29.284164859002168,
"grad_norm": 12881.8603515625,
"learning_rate": 5.1909932487296506e-05,
"loss": 0.8783,
"step": 67500
},
{
"epoch": 29.501084598698483,
"grad_norm": 11561.8046875,
"learning_rate": 5.134234141590315e-05,
"loss": 0.867,
"step": 68000
},
{
"epoch": 29.718004338394795,
"grad_norm": 4195.20458984375,
"learning_rate": 5.077571283466763e-05,
"loss": 0.8623,
"step": 68500
},
{
"epoch": 29.934924078091107,
"grad_norm": 6831.716796875,
"learning_rate": 5.020784880687298e-05,
"loss": 0.8608,
"step": 69000
},
{
"epoch": 30.0,
"eval_loss": 0.8547199964523315,
"eval_map": 0.5,
"eval_map_50": 0.8401,
"eval_map_75": 0.5304,
"eval_map_bus": 0.5762,
"eval_map_car": 0.5197,
"eval_map_container": 0.5424,
"eval_map_large": 0.7118,
"eval_map_medium": 0.4962,
"eval_map_motorbike": 0.3617,
"eval_map_small": 0.1291,
"eval_mar_1": 0.2596,
"eval_mar_10": 0.559,
"eval_mar_100": 0.6079,
"eval_mar_100_bus": 0.6877,
"eval_mar_100_car": 0.6139,
"eval_mar_100_container": 0.6542,
"eval_mar_100_motorbike": 0.4756,
"eval_mar_large": 0.7898,
"eval_mar_medium": 0.6093,
"eval_mar_small": 0.34,
"eval_runtime": 144.8308,
"eval_samples_per_second": 15.901,
"eval_steps_per_second": 1.989,
"step": 69150
},
{
"epoch": 30.15184381778742,
"grad_norm": 9134.2763671875,
"learning_rate": 4.9639957966519604e-05,
"loss": 0.8683,
"step": 69500
},
{
"epoch": 30.36876355748373,
"grad_norm": 6325.7216796875,
"learning_rate": 4.907211357169706e-05,
"loss": 0.8653,
"step": 70000
},
{
"epoch": 30.585683297180044,
"grad_norm": 13625.853515625,
"learning_rate": 4.850438887450347e-05,
"loss": 0.8714,
"step": 70500
},
{
"epoch": 30.802603036876356,
"grad_norm": 15019.505859375,
"learning_rate": 4.793799193390669e-05,
"loss": 0.8566,
"step": 71000
},
{
"epoch": 31.0,
"eval_loss": 0.8513031005859375,
"eval_map": 0.5,
"eval_map_50": 0.8418,
"eval_map_75": 0.5333,
"eval_map_bus": 0.5714,
"eval_map_car": 0.5239,
"eval_map_container": 0.5422,
"eval_map_large": 0.7031,
"eval_map_medium": 0.4972,
"eval_map_motorbike": 0.3626,
"eval_map_small": 0.1282,
"eval_mar_1": 0.2582,
"eval_mar_10": 0.5594,
"eval_mar_100": 0.6082,
"eval_mar_100_bus": 0.6856,
"eval_mar_100_car": 0.6153,
"eval_mar_100_container": 0.6545,
"eval_mar_100_motorbike": 0.4772,
"eval_mar_large": 0.7875,
"eval_mar_medium": 0.6116,
"eval_mar_small": 0.3505,
"eval_runtime": 144.5939,
"eval_samples_per_second": 15.927,
"eval_steps_per_second": 1.992,
"step": 71455
},
{
"epoch": 31.019522776572668,
"grad_norm": 9826.4052734375,
"learning_rate": 4.7370725711717407e-05,
"loss": 0.8693,
"step": 71500
},
{
"epoch": 31.23644251626898,
"grad_norm": 3330.38623046875,
"learning_rate": 4.6803798666703856e-05,
"loss": 0.8625,
"step": 72000
},
{
"epoch": 31.453362255965292,
"grad_norm": 4638.60107421875,
"learning_rate": 4.623728393262576e-05,
"loss": 0.8672,
"step": 72500
},
{
"epoch": 31.670281995661604,
"grad_norm": 10907.923828125,
"learning_rate": 4.5672386115774904e-05,
"loss": 0.8625,
"step": 73000
},
{
"epoch": 31.887201735357916,
"grad_norm": 3609.915283203125,
"learning_rate": 4.5106913993021883e-05,
"loss": 0.8586,
"step": 73500
},
{
"epoch": 32.0,
"eval_loss": 0.8532082438468933,
"eval_map": 0.5035,
"eval_map_50": 0.8414,
"eval_map_75": 0.538,
"eval_map_bus": 0.5799,
"eval_map_car": 0.5235,
"eval_map_container": 0.5481,
"eval_map_large": 0.7084,
"eval_map_medium": 0.4993,
"eval_map_motorbike": 0.3626,
"eval_map_small": 0.1292,
"eval_mar_1": 0.2603,
"eval_mar_10": 0.5621,
"eval_mar_100": 0.6094,
"eval_mar_100_bus": 0.6893,
"eval_mar_100_car": 0.6139,
"eval_mar_100_container": 0.6587,
"eval_mar_100_motorbike": 0.4758,
"eval_mar_large": 0.7924,
"eval_mar_medium": 0.6135,
"eval_mar_small": 0.3286,
"eval_runtime": 145.9881,
"eval_samples_per_second": 15.775,
"eval_steps_per_second": 1.973,
"step": 73760
},
{
"epoch": 32.10412147505423,
"grad_norm": 11651.8828125,
"learning_rate": 4.4542073079838684e-05,
"loss": 0.8618,
"step": 74000
},
{
"epoch": 32.321041214750544,
"grad_norm": 17436.388671875,
"learning_rate": 4.39779362408734e-05,
"loss": 0.8542,
"step": 74500
},
{
"epoch": 32.53796095444685,
"grad_norm": 20459.701171875,
"learning_rate": 4.341457624994828e-05,
"loss": 0.8554,
"step": 75000
},
{
"epoch": 32.75488069414317,
"grad_norm": 5393.4375,
"learning_rate": 4.285318990553778e-05,
"loss": 0.8528,
"step": 75500
},
{
"epoch": 32.971800433839476,
"grad_norm": 4986.16796875,
"learning_rate": 4.229159960541767e-05,
"loss": 0.8598,
"step": 76000
},
{
"epoch": 33.0,
"eval_loss": 0.8493744134902954,
"eval_map": 0.499,
"eval_map_50": 0.8415,
"eval_map_75": 0.5323,
"eval_map_bus": 0.5708,
"eval_map_car": 0.5215,
"eval_map_container": 0.5432,
"eval_map_large": 0.7104,
"eval_map_medium": 0.4969,
"eval_map_motorbike": 0.3606,
"eval_map_small": 0.1301,
"eval_mar_1": 0.2582,
"eval_mar_10": 0.5605,
"eval_mar_100": 0.6084,
"eval_mar_100_bus": 0.6857,
"eval_mar_100_car": 0.615,
"eval_mar_100_container": 0.6551,
"eval_mar_100_motorbike": 0.4778,
"eval_mar_large": 0.7942,
"eval_mar_medium": 0.6113,
"eval_mar_small": 0.3277,
"eval_runtime": 144.7755,
"eval_samples_per_second": 15.907,
"eval_steps_per_second": 1.989,
"step": 76065
},
{
"epoch": 33.18872017353579,
"grad_norm": 6646.677734375,
"learning_rate": 4.173212384261402e-05,
"loss": 0.8671,
"step": 76500
},
{
"epoch": 33.40563991323211,
"grad_norm": 4728.1552734375,
"learning_rate": 4.1172592425996225e-05,
"loss": 0.8671,
"step": 77000
},
{
"epoch": 33.622559652928416,
"grad_norm": 9825.3720703125,
"learning_rate": 4.0614199747616364e-05,
"loss": 0.8668,
"step": 77500
},
{
"epoch": 33.83947939262473,
"grad_norm": 3324.343505859375,
"learning_rate": 4.0057017840298235e-05,
"loss": 0.8728,
"step": 78000
},
{
"epoch": 34.0,
"eval_loss": 0.8495970368385315,
"eval_map": 0.5027,
"eval_map_50": 0.841,
"eval_map_75": 0.5357,
"eval_map_bus": 0.5809,
"eval_map_car": 0.5196,
"eval_map_container": 0.5452,
"eval_map_large": 0.715,
"eval_map_medium": 0.4969,
"eval_map_motorbike": 0.3652,
"eval_map_small": 0.1332,
"eval_mar_1": 0.2609,
"eval_mar_10": 0.5617,
"eval_mar_100": 0.6105,
"eval_mar_100_bus": 0.6941,
"eval_mar_100_car": 0.6116,
"eval_mar_100_container": 0.6565,
"eval_mar_100_motorbike": 0.4799,
"eval_mar_large": 0.7994,
"eval_mar_medium": 0.6147,
"eval_mar_small": 0.3335,
"eval_runtime": 145.9053,
"eval_samples_per_second": 15.784,
"eval_steps_per_second": 1.974,
"step": 78370
},
{
"epoch": 34.05639913232104,
"grad_norm": 20089.041015625,
"learning_rate": 3.950111858067586e-05,
"loss": 0.8606,
"step": 78500
},
{
"epoch": 34.273318872017356,
"grad_norm": 22944.431640625,
"learning_rate": 3.894657367992129e-05,
"loss": 0.8592,
"step": 79000
},
{
"epoch": 34.490238611713664,
"grad_norm": 6247.44970703125,
"learning_rate": 3.8393454674493866e-05,
"loss": 0.8535,
"step": 79500
},
{
"epoch": 34.70715835140998,
"grad_norm": 8178.81982421875,
"learning_rate": 3.7841832916912035e-05,
"loss": 0.8499,
"step": 80000
},
{
"epoch": 34.92407809110629,
"grad_norm": 6138.80712890625,
"learning_rate": 3.7291779566548805e-05,
"loss": 0.8496,
"step": 80500
},
{
"epoch": 35.0,
"eval_loss": 0.8385424613952637,
"eval_map": 0.5081,
"eval_map_50": 0.8476,
"eval_map_75": 0.5424,
"eval_map_bus": 0.5828,
"eval_map_car": 0.5317,
"eval_map_container": 0.5475,
"eval_map_large": 0.7206,
"eval_map_medium": 0.504,
"eval_map_motorbike": 0.3703,
"eval_map_small": 0.1423,
"eval_mar_1": 0.2623,
"eval_mar_10": 0.5665,
"eval_mar_100": 0.6148,
"eval_mar_100_bus": 0.6954,
"eval_mar_100_car": 0.6213,
"eval_mar_100_container": 0.6591,
"eval_mar_100_motorbike": 0.4833,
"eval_mar_large": 0.8048,
"eval_mar_medium": 0.6188,
"eval_mar_small": 0.3475,
"eval_runtime": 144.7118,
"eval_samples_per_second": 15.914,
"eval_steps_per_second": 1.99,
"step": 80675
},
{
"epoch": 35.140997830802604,
"grad_norm": 5527.109375,
"learning_rate": 3.674446072528038e-05,
"loss": 0.8416,
"step": 81000
},
{
"epoch": 35.35791757049891,
"grad_norm": 6165.18603515625,
"learning_rate": 3.619775335834121e-05,
"loss": 0.8443,
"step": 81500
},
{
"epoch": 35.57483731019523,
"grad_norm": 7007.72900390625,
"learning_rate": 3.5652826485379264e-05,
"loss": 0.8546,
"step": 82000
},
{
"epoch": 35.79175704989154,
"grad_norm": 7134.87548828125,
"learning_rate": 3.5109750402125426e-05,
"loss": 0.8477,
"step": 82500
},
{
"epoch": 36.0,
"eval_loss": 0.840656042098999,
"eval_map": 0.5078,
"eval_map_50": 0.8475,
"eval_map_75": 0.543,
"eval_map_bus": 0.5808,
"eval_map_car": 0.5308,
"eval_map_container": 0.5506,
"eval_map_large": 0.7143,
"eval_map_medium": 0.5038,
"eval_map_motorbike": 0.3689,
"eval_map_small": 0.1375,
"eval_mar_1": 0.2612,
"eval_mar_10": 0.5658,
"eval_mar_100": 0.6127,
"eval_mar_100_bus": 0.6911,
"eval_mar_100_car": 0.6198,
"eval_mar_100_container": 0.6566,
"eval_mar_100_motorbike": 0.4835,
"eval_mar_large": 0.7981,
"eval_mar_medium": 0.6156,
"eval_mar_small": 0.3327,
"eval_runtime": 144.8577,
"eval_samples_per_second": 15.898,
"eval_steps_per_second": 1.988,
"step": 82980
}
],
"logging_steps": 500,
"max_steps": 138300,
"num_input_tokens_seen": 0,
"num_train_epochs": 60,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.526046904086461e+20,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}