{ "best_metric": 2.9787235260009766, "best_model_checkpoint": "/mnt/output/projects/sca-xiaoke-v3/amlt-results/7300886584.15971-e315970f-15b9-410a-b0a9-3912402cdf8b/checkpoint-195000", "epoch": 82.67879288962381, "global_step": 200000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "_prepare_inputs_in_ms": 14.42616805434227, "compute_loss_in_ms": 1299.8907640576363, "epoch": 0.0, "learning_rate/full": 0.0, "loss": 9.016, "step": 1, "training_step_in_ms": 2032.6302126049995 }, { "epoch": 0.0, "eval_visual_genome-densecap-local-densecap-test_loss": 9.1282958984375, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.03355821582361717, "eval_visual_genome-densecap-local-densecap-test_runtime": 189.4348, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 4.223, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.132, "step": 1 }, { "_prepare_inputs_in_ms": 4.084589669218985, "compute_loss_in_ms": 284.03653898784466, "epoch": 0.41, "learning_rate/full": 0.00039998495845181817, "loss": 3.8908, "step": 1000, "training_step_in_ms": 1082.7972516678535 }, { "_prepare_inputs_in_ms": 4.054305288940668, "compute_loss_in_ms": 284.15025370568037, "epoch": 0.83, "learning_rate/full": 0.0003999216713877652, "loss": 3.4805, "step": 2000, "training_step_in_ms": 1086.274579320103 }, { "_prepare_inputs_in_ms": 4.071794345974922, "compute_loss_in_ms": 284.45942908525467, "epoch": 1.24, "learning_rate/full": 0.00039980895784128267, "loss": 3.405, "step": 3000, "training_step_in_ms": 1119.1077427528799 }, { "_prepare_inputs_in_ms": 4.085798408836126, "compute_loss_in_ms": 284.8285736106336, "epoch": 1.65, "learning_rate/full": 0.00039964684567845476, "loss": 3.3537, "step": 4000, "training_step_in_ms": 1150.6125138737261 }, { "_prepare_inputs_in_ms": 4.0938322730362415, "compute_loss_in_ms": 285.10985093563795, "epoch": 2.07, "learning_rate/full": 0.0003994358471466495, "loss": 3.3218, "step": 5000, "training_step_in_ms": 1108.4499053694308 }, { "epoch": 2.07, "eval_visual_genome-densecap-local-densecap-test_loss": 3.269989252090454, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.21715476097311398, "eval_visual_genome-densecap-local-densecap-test_runtime": 111.5411, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.172, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.224, "step": 5000 }, { "_prepare_inputs_in_ms": 4.128877357011888, "compute_loss_in_ms": 285.1207774169743, "epoch": 2.48, "learning_rate/full": 0.0003991751687428334, "loss": 3.2918, "step": 6000, "training_step_in_ms": 1120.3654654994607 }, { "_prepare_inputs_in_ms": 4.121768821030855, "compute_loss_in_ms": 284.9130438826978, "epoch": 2.89, "learning_rate/full": 0.0003988659173490642, "loss": 3.2675, "step": 7000, "training_step_in_ms": 1130.791154742241 }, { "_prepare_inputs_in_ms": 4.129346951842308, "compute_loss_in_ms": 285.35304405912757, "epoch": 3.31, "learning_rate/full": 0.0003985069299623724, "loss": 3.2451, "step": 8000, "training_step_in_ms": 1133.7338739708066 }, { "_prepare_inputs_in_ms": 4.133303381502628, "compute_loss_in_ms": 285.2391963750124, "epoch": 3.72, "learning_rate/full": 0.0003980992984040504, "loss": 3.2334, "step": 9000, "training_step_in_ms": 1086.6298492662609 }, { "_prepare_inputs_in_ms": 4.132662046700716, "compute_loss_in_ms": 285.1939390525222, "epoch": 4.13, "learning_rate/full": 0.00039764230739017226, "loss": 3.2122, "step": 10000, "training_step_in_ms": 1111.2217365466058 }, { "epoch": 4.13, "eval_visual_genome-densecap-local-densecap-test_loss": 3.1718945503234863, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.23451229725961228, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.8619, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.349, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 10000 }, { "_prepare_inputs_in_ms": 4.151588522079514, "compute_loss_in_ms": 285.39055866748095, "epoch": 4.55, "learning_rate/full": 0.00039713751381134497, "loss": 3.1979, "step": 11000, "training_step_in_ms": 1089.2837468609214 }, { "_prepare_inputs_in_ms": 4.139887526631355, "compute_loss_in_ms": 285.3860225379467, "epoch": 4.96, "learning_rate/full": 0.000396583019288311, "loss": 3.1933, "step": 12000, "training_step_in_ms": 1084.1714271605015 }, { "_prepare_inputs_in_ms": 4.176147662103176, "compute_loss_in_ms": 285.6273371577263, "epoch": 5.37, "learning_rate/full": 0.0003959805510184613, "loss": 3.1765, "step": 13000, "training_step_in_ms": 1089.3080548346043 }, { "_prepare_inputs_in_ms": 4.1766685508191586, "compute_loss_in_ms": 285.3720509596169, "epoch": 5.79, "learning_rate/full": 0.00039532972748016767, "loss": 3.1727, "step": 14000, "training_step_in_ms": 1091.7199603579938 }, { "_prepare_inputs_in_ms": 4.191178072243929, "compute_loss_in_ms": 285.4580160602927, "epoch": 6.2, "learning_rate/full": 0.0003946307092543998, "loss": 3.1591, "step": 15000, "training_step_in_ms": 1090.6033144891262 }, { "epoch": 6.2, "eval_visual_genome-densecap-local-densecap-test_loss": 3.1219239234924316, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.24624792238728155, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.8497, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.35, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 15000 }, { "_prepare_inputs_in_ms": 4.180258305334464, "compute_loss_in_ms": 285.4601420760155, "epoch": 6.61, "learning_rate/full": 0.0003938828970266217, "loss": 3.1562, "step": 16000, "training_step_in_ms": 1084.842809855938 }, { "_prepare_inputs_in_ms": 4.194100107997656, "compute_loss_in_ms": 285.48905945569277, "epoch": 7.03, "learning_rate/full": 0.00039308797090204444, "loss": 3.1508, "step": 17000, "training_step_in_ms": 1085.5392471551895 }, { "_prepare_inputs_in_ms": 4.201232250779867, "compute_loss_in_ms": 285.61364733427763, "epoch": 7.44, "learning_rate/full": 0.0003922445359987763, "loss": 3.1333, "step": 18000, "training_step_in_ms": 1091.4973263852298 }, { "_prepare_inputs_in_ms": 4.189023811370134, "compute_loss_in_ms": 285.4624082148075, "epoch": 7.85, "learning_rate/full": 0.0003913554018411121, "loss": 3.1351, "step": 19000, "training_step_in_ms": 1095.9623138792813 }, { "_prepare_inputs_in_ms": 4.215472485870123, "compute_loss_in_ms": 285.6230415776372, "epoch": 8.27, "learning_rate/full": 0.00039041818639024787, "loss": 3.1297, "step": 20000, "training_step_in_ms": 1185.9847482070327 }, { "epoch": 8.27, "eval_visual_genome-densecap-local-densecap-test_loss": 3.094672918319702, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.24975866124736495, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.4566, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.376, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.231, "step": 20000 }, { "_prepare_inputs_in_ms": 4.1831618874538234, "compute_loss_in_ms": 285.3183429725468, "epoch": 8.68, "learning_rate/full": 0.00038943398810118026, "loss": 3.119, "step": 21000, "training_step_in_ms": 1082.7558356113732 }, { "_prepare_inputs_in_ms": 4.174146838486195, "compute_loss_in_ms": 285.4058397859335, "epoch": 9.09, "learning_rate/full": 0.0003884019945070803, "loss": 3.1178, "step": 22000, "training_step_in_ms": 1087.0350129008293 }, { "_prepare_inputs_in_ms": 4.204949229955673, "compute_loss_in_ms": 285.3504670076072, "epoch": 9.51, "learning_rate/full": 0.00038732452418171673, "loss": 3.1093, "step": 23000, "training_step_in_ms": 1090.7997342124581 }, { "_prepare_inputs_in_ms": 4.196985870599747, "compute_loss_in_ms": 285.4016271494329, "epoch": 9.92, "learning_rate/full": 0.0003862008343330083, "loss": 3.1062, "step": 24000, "training_step_in_ms": 1090.5269000642002 }, { "_prepare_inputs_in_ms": 4.206760194152594, "compute_loss_in_ms": 285.6653628349304, "epoch": 10.33, "learning_rate/full": 0.00038503000849003844, "loss": 3.0972, "step": 25000, "training_step_in_ms": 1090.913136728108 }, { "epoch": 10.33, "eval_visual_genome-densecap-local-densecap-test_loss": 3.075335741043091, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.25707208633373096, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.472, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.375, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 25000 }, { "_prepare_inputs_in_ms": 4.204354642367944, "compute_loss_in_ms": 285.44070146232843, "epoch": 10.75, "learning_rate/full": 0.0003838159164157488, "loss": 3.097, "step": 26000, "training_step_in_ms": 1085.0929874032736 }, { "_prepare_inputs_in_ms": 4.202797457575798, "compute_loss_in_ms": 285.55905482545495, "epoch": 11.16, "learning_rate/full": 0.00038255527679000744, "loss": 3.0903, "step": 27000, "training_step_in_ms": 1089.4926370121539 }, { "_prepare_inputs_in_ms": 4.2012519761919975, "compute_loss_in_ms": 285.71758703514934, "epoch": 11.58, "learning_rate/full": 0.0003812482649321827, "loss": 3.0892, "step": 28000, "training_step_in_ms": 1090.198759533465 }, { "_prepare_inputs_in_ms": 4.220829274505377, "compute_loss_in_ms": 285.5986107811332, "epoch": 11.99, "learning_rate/full": 0.0003798978172979138, "loss": 3.0889, "step": 29000, "training_step_in_ms": 1085.0686310827732 }, { "_prepare_inputs_in_ms": 4.217640113085508, "compute_loss_in_ms": 285.6399230584502, "epoch": 12.4, "learning_rate/full": 0.0003785029825690954, "loss": 3.0749, "step": 30000, "training_step_in_ms": 1087.9900991134346 }, { "epoch": 12.4, "eval_visual_genome-densecap-local-densecap-test_loss": 3.058861017227173, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.25600252799309026, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.6245, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.298, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 30000 }, { "_prepare_inputs_in_ms": 4.224213841484814, "compute_loss_in_ms": 285.3009058833122, "epoch": 12.82, "learning_rate/full": 0.00037706410490032555, "loss": 3.0794, "step": 31000, "training_step_in_ms": 1087.378763064742 }, { "_prepare_inputs_in_ms": 4.233129996806383, "compute_loss_in_ms": 285.4745088033378, "epoch": 13.23, "learning_rate/full": 0.0003755815393131386, "loss": 3.074, "step": 32000, "training_step_in_ms": 1091.7205754183233 }, { "_prepare_inputs_in_ms": 4.223707340657711, "compute_loss_in_ms": 285.1553194858134, "epoch": 13.64, "learning_rate/full": 0.0003740556516084091, "loss": 3.0686, "step": 33000, "training_step_in_ms": 1087.8120190612972 }, { "_prepare_inputs_in_ms": 4.245889626443386, "compute_loss_in_ms": 285.67459550127387, "epoch": 14.06, "learning_rate/full": 0.0003724852264850082, "loss": 3.0733, "step": 34000, "training_step_in_ms": 1086.3751963675022 }, { "_prepare_inputs_in_ms": 4.233293745666742, "compute_loss_in_ms": 285.4981838874519, "epoch": 14.47, "learning_rate/full": 0.00037087542640234865, "loss": 3.064, "step": 35000, "training_step_in_ms": 1089.8129360377789 }, { "epoch": 14.47, "eval_visual_genome-densecap-local-densecap-test_loss": 3.052946090698242, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2584196718918565, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.4779, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.375, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 35000 }, { "_prepare_inputs_in_ms": 4.194417025257901, "compute_loss_in_ms": 285.25339871644974, "epoch": 14.88, "learning_rate/full": 0.00036922019737873653, "loss": 3.064, "step": 36000, "training_step_in_ms": 1084.3368335030973 }, { "_prepare_inputs_in_ms": 4.225800335407257, "compute_loss_in_ms": 285.52921985834837, "epoch": 15.3, "learning_rate/full": 0.00036752484999829976, "loss": 3.0581, "step": 37000, "training_step_in_ms": 1090.5179475583136 }, { "_prepare_inputs_in_ms": 4.208773214370012, "compute_loss_in_ms": 285.2426546551287, "epoch": 15.71, "learning_rate/full": 0.0003657881683678541, "loss": 3.0581, "step": 38000, "training_step_in_ms": 1089.0830878019333 }, { "_prepare_inputs_in_ms": 4.219740275293589, "compute_loss_in_ms": 285.45426247641444, "epoch": 16.12, "learning_rate/full": 0.00036401058098760525, "loss": 3.0534, "step": 39000, "training_step_in_ms": 1088.1995187923312 }, { "_prepare_inputs_in_ms": 4.224584739655256, "compute_loss_in_ms": 285.29780930280685, "epoch": 16.54, "learning_rate/full": 0.00036219068645119566, "loss": 3.0525, "step": 40000, "training_step_in_ms": 1088.9517585895956 }, { "epoch": 16.54, "eval_visual_genome-densecap-local-densecap-test_loss": 3.0416412353515625, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26328806809020683, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.03, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.271, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 40000 }, { "_prepare_inputs_in_ms": 4.210097938776016, "compute_loss_in_ms": 285.2052926979959, "epoch": 16.95, "learning_rate/full": 0.0003603344533347134, "loss": 3.0483, "step": 41000, "training_step_in_ms": 1085.6118382960558 }, { "_prepare_inputs_in_ms": 4.248851552605629, "compute_loss_in_ms": 285.6537539064884, "epoch": 17.36, "learning_rate/full": 0.00035843490089475537, "loss": 3.0399, "step": 42000, "training_step_in_ms": 1091.6559825353324 }, { "_prepare_inputs_in_ms": 4.214634284377098, "compute_loss_in_ms": 285.3575124628842, "epoch": 17.78, "learning_rate/full": 0.0003564981368437495, "loss": 3.0455, "step": 43000, "training_step_in_ms": 1088.8244492001832 }, { "_prepare_inputs_in_ms": 4.242138650268316, "compute_loss_in_ms": 285.5602181442082, "epoch": 18.19, "learning_rate/full": 0.00035452076268085417, "loss": 3.0397, "step": 44000, "training_step_in_ms": 1087.6106830611825 }, { "_prepare_inputs_in_ms": 4.231096193194389, "compute_loss_in_ms": 285.38128500804305, "epoch": 18.6, "learning_rate/full": 0.0003525072209606466, "loss": 3.0366, "step": 45000, "training_step_in_ms": 1090.0634618513286 }, { "epoch": 18.6, "eval_visual_genome-densecap-local-densecap-test_loss": 3.0333669185638428, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.262616571295984, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.2623, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.389, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.231, "step": 45000 }, { "_prepare_inputs_in_ms": 4.224474132061005, "compute_loss_in_ms": 285.69229750707746, "epoch": 19.02, "learning_rate/full": 0.00035045605036568154, "loss": 3.0403, "step": 46000, "training_step_in_ms": 1087.4972796961665 }, { "_prepare_inputs_in_ms": 4.218343399465084, "compute_loss_in_ms": 285.2950618080795, "epoch": 19.43, "learning_rate/full": 0.0003483677569916109, "loss": 3.0296, "step": 47000, "training_step_in_ms": 1088.6641021184623 }, { "_prepare_inputs_in_ms": 4.212014690041542, "compute_loss_in_ms": 285.24483662098646, "epoch": 19.84, "learning_rate/full": 0.0003462450012513184, "loss": 3.0351, "step": 48000, "training_step_in_ms": 1086.902916610241 }, { "_prepare_inputs_in_ms": 4.228286672383547, "compute_loss_in_ms": 285.4265847504139, "epoch": 20.26, "learning_rate/full": 0.0003440818719590809, "loss": 3.0301, "step": 49000, "training_step_in_ms": 1089.4173335321248 }, { "_prepare_inputs_in_ms": 4.209285493940115, "compute_loss_in_ms": 285.17769135162234, "epoch": 20.67, "learning_rate/full": 0.0003418853377786221, "loss": 3.0266, "step": 50000, "training_step_in_ms": 1092.610530115664 }, { "epoch": 20.67, "eval_visual_genome-densecap-local-densecap-test_loss": 3.026047468185425, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26601445767420673, "eval_visual_genome-densecap-local-densecap-test_runtime": 111.3497, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.185, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.225, "step": 50000 }, { "_prepare_inputs_in_ms": 4.215818756237263, "compute_loss_in_ms": 285.3216738887131, "epoch": 21.08, "learning_rate/full": 0.00033965379551414244, "loss": 3.0364, "step": 51000, "training_step_in_ms": 1090.6509163863957 }, { "_prepare_inputs_in_ms": 4.2158047296106815, "compute_loss_in_ms": 285.3607781082392, "epoch": 21.5, "learning_rate/full": 0.00033738779576530426, "loss": 3.0221, "step": 52000, "training_step_in_ms": 1089.9412010349333 }, { "_prepare_inputs_in_ms": 4.225385930389166, "compute_loss_in_ms": 285.4064598791301, "epoch": 21.91, "learning_rate/full": 0.0003350878976336386, "loss": 3.0233, "step": 53000, "training_step_in_ms": 1086.4266870431602 }, { "_prepare_inputs_in_ms": 4.2348253689706326, "compute_loss_in_ms": 285.5650148577988, "epoch": 22.32, "learning_rate/full": 0.0003327546685845955, "loss": 3.0177, "step": 54000, "training_step_in_ms": 1090.5466065071523 }, { "_prepare_inputs_in_ms": 4.244904510676861, "compute_loss_in_ms": 285.4943734779954, "epoch": 22.74, "learning_rate/full": 0.00033038868430752995, "loss": 3.0227, "step": 55000, "training_step_in_ms": 1089.5386388339102 }, { "epoch": 22.74, "eval_visual_genome-densecap-local-densecap-test_loss": 3.0213677883148193, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26657402454724916, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.863, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.282, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 55000 }, { "_prepare_inputs_in_ms": 4.222077999900027, "compute_loss_in_ms": 285.3860865868628, "epoch": 23.15, "learning_rate/full": 0.00032798811209649607, "loss": 3.0201, "step": 56000, "training_step_in_ms": 1089.8713997229934 }, { "_prepare_inputs_in_ms": 4.218684710562229, "compute_loss_in_ms": 285.196179587394, "epoch": 23.56, "learning_rate/full": 0.0003255583453025672, "loss": 3.0133, "step": 57000, "training_step_in_ms": 1088.3847643770278 }, { "_prepare_inputs_in_ms": 4.225137319415808, "compute_loss_in_ms": 285.31357542052865, "epoch": 23.98, "learning_rate/full": 0.0003231000773635045, "loss": 3.0174, "step": 58000, "training_step_in_ms": 1086.5370167195797 }, { "_prepare_inputs_in_ms": 4.230918549001217, "compute_loss_in_ms": 285.4190446138382, "epoch": 24.39, "learning_rate/full": 0.0003206140056326384, "loss": 3.0116, "step": 59000, "training_step_in_ms": 1090.3938182927668 }, { "_prepare_inputs_in_ms": 4.227691676467657, "compute_loss_in_ms": 285.3117839321494, "epoch": 24.8, "learning_rate/full": 0.000318090679282307, "loss": 3.0123, "step": 60000, "training_step_in_ms": 1090.3038867227733 }, { "epoch": 24.8, "eval_visual_genome-densecap-local-densecap-test_loss": 3.0163190364837646, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2694944095513101, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.5302, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.304, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 60000 }, { "_prepare_inputs_in_ms": 4.2251157578898635, "compute_loss_in_ms": 285.44914393499494, "epoch": 25.22, "learning_rate/full": 0.0003155381574633497, "loss": 3.0074, "step": 61000, "training_step_in_ms": 1087.7947441898286 }, { "_prepare_inputs_in_ms": 4.233858399093151, "compute_loss_in_ms": 285.5572083890438, "epoch": 25.63, "learning_rate/full": 0.0003129570712337902, "loss": 3.0038, "step": 62000, "training_step_in_ms": 1091.406288355589 }, { "_prepare_inputs_in_ms": 4.241201400756836, "compute_loss_in_ms": 285.4022887274623, "epoch": 26.04, "learning_rate/full": 0.00031035068146119334, "loss": 3.0069, "step": 63000, "training_step_in_ms": 1089.0374966450036 }, { "_prepare_inputs_in_ms": 4.214517045766115, "compute_loss_in_ms": 285.32751731202006, "epoch": 26.46, "learning_rate/full": 0.0003077170643091587, "loss": 3.0004, "step": 64000, "training_step_in_ms": 1089.311513543129 }, { "_prepare_inputs_in_ms": 4.223439604043961, "compute_loss_in_ms": 285.6179902665317, "epoch": 26.87, "learning_rate/full": 0.00030505419362911944, "loss": 3.0048, "step": 65000, "training_step_in_ms": 1088.4543421529233 }, { "epoch": 26.87, "eval_visual_genome-densecap-local-densecap-test_loss": 3.012563705444336, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26603180141607496, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.7667, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.355, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 65000 }, { "_prepare_inputs_in_ms": 4.235190596522354, "compute_loss_in_ms": 285.59519398212433, "epoch": 27.28, "learning_rate/full": 0.0003023680520765336, "loss": 2.9934, "step": 66000, "training_step_in_ms": 1088.0777766555548 }, { "_prepare_inputs_in_ms": 4.217139046639204, "compute_loss_in_ms": 285.50919711589813, "epoch": 27.7, "learning_rate/full": 0.0002996566527388639, "loss": 2.9982, "step": 67000, "training_step_in_ms": 1091.6493426598608 }, { "_prepare_inputs_in_ms": 4.244372218847275, "compute_loss_in_ms": 285.5752951391041, "epoch": 28.11, "learning_rate/full": 0.0002969206646133254, "loss": 2.9969, "step": 68000, "training_step_in_ms": 1088.2136982679367 }, { "_prepare_inputs_in_ms": 4.213636931031942, "compute_loss_in_ms": 285.255677562207, "epoch": 28.52, "learning_rate/full": 0.0002941607627640486, "loss": 2.9923, "step": 69000, "training_step_in_ms": 1088.9643149748445 }, { "_prepare_inputs_in_ms": 4.2318920604884624, "compute_loss_in_ms": 285.6222639977932, "epoch": 28.94, "learning_rate/full": 0.0002913748308243434, "loss": 2.9912, "step": 70000, "training_step_in_ms": 1086.640508864075 }, { "epoch": 28.94, "eval_visual_genome-densecap-local-densecap-test_loss": 3.01218318939209, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2704365100152127, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.8069, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.286, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 70000 }, { "_prepare_inputs_in_ms": 4.22964243627176, "compute_loss_in_ms": 285.81058219075203, "epoch": 29.35, "learning_rate/full": 0.00028856630835486283, "loss": 2.9907, "step": 71000, "training_step_in_ms": 1089.0001546032727 }, { "_prepare_inputs_in_ms": 4.219989389181137, "compute_loss_in_ms": 285.4850408025086, "epoch": 29.76, "learning_rate/full": 0.00028574157192993993, "loss": 2.9922, "step": 72000, "training_step_in_ms": 1112.2257943935692 }, { "_prepare_inputs_in_ms": 4.236269619315863, "compute_loss_in_ms": 285.3517268039286, "epoch": 30.18, "learning_rate/full": 0.0002828899985518552, "loss": 2.9829, "step": 73000, "training_step_in_ms": 1115.709298092872 }, { "_prepare_inputs_in_ms": 4.212801028043032, "compute_loss_in_ms": 285.1435379870236, "epoch": 30.59, "learning_rate/full": 0.0002800179323426103, "loss": 2.9854, "step": 74000, "training_step_in_ms": 1112.750349264592 }, { "_prepare_inputs_in_ms": 4.226626381278038, "compute_loss_in_ms": 285.37043143063784, "epoch": 31.0, "learning_rate/full": 0.0002771289848538608, "loss": 2.9928, "step": 75000, "training_step_in_ms": 1113.63447811082 }, { "epoch": 31.0, "eval_visual_genome-densecap-local-densecap-test_loss": 3.00150203704834, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27227553064507803, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.2006, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.259, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 75000 }, { "_prepare_inputs_in_ms": 4.221666444365571, "compute_loss_in_ms": 285.4123991020024, "epoch": 31.42, "learning_rate/full": 0.00027422392710754273, "loss": 2.9787, "step": 76000, "training_step_in_ms": 1110.9835148528218 }, { "_prepare_inputs_in_ms": 4.2181270979344845, "compute_loss_in_ms": 285.3203030079603, "epoch": 31.83, "learning_rate/full": 0.0002712947161076778, "loss": 2.9822, "step": 77000, "training_step_in_ms": 1113.9973731786013 }, { "_prepare_inputs_in_ms": 4.2350912764668465, "compute_loss_in_ms": 285.4480539858341, "epoch": 32.24, "learning_rate/full": 0.00026835083436875734, "loss": 2.9765, "step": 78000, "training_step_in_ms": 1115.4474330842495 }, { "_prepare_inputs_in_ms": 4.229009635746479, "compute_loss_in_ms": 285.5191092900932, "epoch": 32.66, "learning_rate/full": 0.0002653871161688328, "loss": 2.9801, "step": 79000, "training_step_in_ms": 1113.7964499779046 }, { "_prepare_inputs_in_ms": 4.2362766563892365, "compute_loss_in_ms": 285.7597692273557, "epoch": 33.07, "learning_rate/full": 0.00026241022007566643, "loss": 2.9807, "step": 80000, "training_step_in_ms": 1115.4754909984767 }, { "epoch": 33.07, "eval_visual_genome-densecap-local-densecap-test_loss": 3.000786781311035, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2716794971860456, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.7776, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.354, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 80000 }, { "_prepare_inputs_in_ms": 4.232099074416045, "compute_loss_in_ms": 285.50172889232635, "epoch": 33.48, "learning_rate/full": 0.0002594179251945605, "loss": 2.9739, "step": 81000, "training_step_in_ms": 1110.9056022837758 }, { "_prepare_inputs_in_ms": 4.237273696810007, "compute_loss_in_ms": 285.7116014882922, "epoch": 33.9, "learning_rate/full": 0.00025641096982950234, "loss": 2.9746, "step": 82000, "training_step_in_ms": 1110.9737426675856 }, { "_prepare_inputs_in_ms": 4.237969063222408, "compute_loss_in_ms": 285.6498990356922, "epoch": 34.31, "learning_rate/full": 0.00025339009590173424, "loss": 2.9727, "step": 83000, "training_step_in_ms": 1117.3185790739954 }, { "_prepare_inputs_in_ms": 4.234774090349674, "compute_loss_in_ms": 285.5246250964701, "epoch": 34.73, "learning_rate/full": 0.00025035604876669546, "loss": 2.9709, "step": 84000, "training_step_in_ms": 1111.8130441047251 }, { "_prepare_inputs_in_ms": 4.248618151992559, "compute_loss_in_ms": 285.6561874523759, "epoch": 35.14, "learning_rate/full": 0.00024731263251348453, "loss": 2.969, "step": 85000, "training_step_in_ms": 1112.8755748830736 }, { "epoch": 35.14, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9980032444000244, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2741870945987276, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.6613, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.229, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.226, "step": 85000 }, { "_prepare_inputs_in_ms": 4.240446417796902, "compute_loss_in_ms": 285.5394543148577, "epoch": 35.55, "learning_rate/full": 0.00024425143236331536, "loss": 2.9639, "step": 86000, "training_step_in_ms": 1110.7865899279714 }, { "_prepare_inputs_in_ms": 4.2231163419783115, "compute_loss_in_ms": 285.532758615911, "epoch": 35.97, "learning_rate/full": 0.000241179291965253, "loss": 2.971, "step": 87000, "training_step_in_ms": 1113.825252827257 }, { "_prepare_inputs_in_ms": 4.229363452643156, "compute_loss_in_ms": 285.72211230918765, "epoch": 36.38, "learning_rate/full": 0.0002381000579951894, "loss": 2.9636, "step": 88000, "training_step_in_ms": 1118.3622099086642 }, { "_prepare_inputs_in_ms": 4.2257860116660595, "compute_loss_in_ms": 285.5116978622973, "epoch": 36.79, "learning_rate/full": 0.00023501142340591894, "loss": 2.9656, "step": 89000, "training_step_in_ms": 1111.638593826443 }, { "_prepare_inputs_in_ms": 4.221606273204088, "compute_loss_in_ms": 285.61226362735033, "epoch": 37.21, "learning_rate/full": 0.00023191415027181022, "loss": 2.9615, "step": 90000, "training_step_in_ms": 1116.2303377054632 }, { "epoch": 37.21, "eval_visual_genome-densecap-local-densecap-test_loss": 2.996258020401001, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27303322222107285, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.8741, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.348, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 90000 }, { "_prepare_inputs_in_ms": 4.207164986831386, "compute_loss_in_ms": 285.1755935549736, "epoch": 37.62, "learning_rate/full": 0.00022881211473645583, "loss": 2.963, "step": 91000, "training_step_in_ms": 1110.297369044274 }, { "_prepare_inputs_in_ms": 4.222084645181894, "compute_loss_in_ms": 285.53527039662004, "epoch": 38.03, "learning_rate/full": 0.00022570298446764845, "loss": 2.9633, "step": 92000, "training_step_in_ms": 1112.9915070161223 }, { "_prepare_inputs_in_ms": 4.232885275036097, "compute_loss_in_ms": 285.5158912166953, "epoch": 38.45, "learning_rate/full": 0.00022258127581536945, "loss": 2.9538, "step": 93000, "training_step_in_ms": 1114.245859079063 }, { "_prepare_inputs_in_ms": 4.250343676656485, "compute_loss_in_ms": 285.64605471119285, "epoch": 38.86, "learning_rate/full": 0.00021945398441148287, "loss": 2.9572, "step": 94000, "training_step_in_ms": 1112.7353053241968 }, { "_prepare_inputs_in_ms": 4.230448927730322, "compute_loss_in_ms": 285.5413333699107, "epoch": 39.27, "learning_rate/full": 0.00021632501765960936, "loss": 2.958, "step": 95000, "training_step_in_ms": 1112.5333589836955 }, { "epoch": 39.27, "eval_visual_genome-densecap-local-densecap-test_loss": 2.993772506713867, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27348855682421375, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.9695, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.342, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.229, "step": 95000 }, { "_prepare_inputs_in_ms": 4.215012745159428, "compute_loss_in_ms": 285.35930648073554, "epoch": 39.69, "learning_rate/full": 0.0002131920229539048, "loss": 2.9558, "step": 96000, "training_step_in_ms": 1111.498819194734 }, { "_prepare_inputs_in_ms": 4.221161104738712, "compute_loss_in_ms": 285.453462138772, "epoch": 40.1, "learning_rate/full": 0.00021005263255270636, "loss": 2.9559, "step": 97000, "training_step_in_ms": 1114.1434171833098 }, { "_prepare_inputs_in_ms": 4.220512144267559, "compute_loss_in_ms": 285.53688745573163, "epoch": 40.51, "learning_rate/full": 0.0002069107568468244, "loss": 2.9525, "step": 98000, "training_step_in_ms": 1116.582923579961 }, { "_prepare_inputs_in_ms": 4.22445010766387, "compute_loss_in_ms": 285.29584189876914, "epoch": 40.93, "learning_rate/full": 0.00020377031677881017, "loss": 2.9509, "step": 99000, "training_step_in_ms": 1112.9648886173964 }, { "_prepare_inputs_in_ms": 4.237125843763351, "compute_loss_in_ms": 285.87847367301583, "epoch": 41.34, "learning_rate/full": 0.00020062580171962844, "loss": 2.9397, "step": 100000, "training_step_in_ms": 1119.0427548959851 }, { "epoch": 41.34, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9917938709259033, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27402243679815436, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.6022, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.366, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 100000 }, { "_prepare_inputs_in_ms": 4.220401306704777, "compute_loss_in_ms": 285.4624089188874, "epoch": 41.75, "learning_rate/full": 0.00019748427643225179, "loss": 2.9497, "step": 101000, "training_step_in_ms": 1113.234252423048 }, { "_prepare_inputs_in_ms": 4.218052037060261, "compute_loss_in_ms": 285.50472677126527, "epoch": 42.17, "learning_rate/full": 0.0001943402283833764, "loss": 2.9442, "step": 102000, "training_step_in_ms": 1114.7688954658806 }, { "_prepare_inputs_in_ms": 4.22609718888998, "compute_loss_in_ms": 285.6670557744801, "epoch": 42.58, "learning_rate/full": 0.0001911975795955237, "loss": 2.938, "step": 103000, "training_step_in_ms": 1114.2966277077794 }, { "_prepare_inputs_in_ms": 4.231020983308554, "compute_loss_in_ms": 285.41950649395585, "epoch": 42.99, "learning_rate/full": 0.00018806024615043859, "loss": 2.9429, "step": 104000, "training_step_in_ms": 1112.3123243488371 }, { "_prepare_inputs_in_ms": 4.231835335493088, "compute_loss_in_ms": 285.55181711539626, "epoch": 43.41, "learning_rate/full": 0.0001849258586609575, "loss": 2.9355, "step": 105000, "training_step_in_ms": 1116.4177654609084 }, { "epoch": 43.41, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9879465103149414, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.275499690988243, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.1682, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.328, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.229, "step": 105000 }, { "_prepare_inputs_in_ms": 4.192932469815743, "compute_loss_in_ms": 285.3939059227705, "epoch": 43.82, "learning_rate/full": 0.0001817951904902926, "loss": 2.9411, "step": 106000, "training_step_in_ms": 1111.0442412495613 }, { "_prepare_inputs_in_ms": 4.18786546587944, "compute_loss_in_ms": 285.60110822692513, "epoch": 44.23, "learning_rate/full": 0.00017866588728649688, "loss": 2.9389, "step": 107000, "training_step_in_ms": 1114.2360820770264 }, { "_prepare_inputs_in_ms": 4.191282417625189, "compute_loss_in_ms": 285.483426745981, "epoch": 44.65, "learning_rate/full": 0.00017554497963615946, "loss": 2.9396, "step": 108000, "training_step_in_ms": 1113.102070134133 }, { "_prepare_inputs_in_ms": 4.215992953628302, "compute_loss_in_ms": 285.87069864198565, "epoch": 45.06, "learning_rate/full": 0.00017243010589616854, "loss": 2.9398, "step": 109000, "training_step_in_ms": 1115.9531138837337 }, { "_prepare_inputs_in_ms": 4.180787291377783, "compute_loss_in_ms": 285.6199772916734, "epoch": 45.47, "learning_rate/full": 0.00016932203461501055, "loss": 2.9354, "step": 110000, "training_step_in_ms": 1112.3631411641836 }, { "epoch": 45.47, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9866650104522705, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27461185232552654, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.9151, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.345, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 110000 }, { "_prepare_inputs_in_ms": 4.1715224159926905, "compute_loss_in_ms": 285.4828831627965, "epoch": 45.89, "learning_rate/full": 0.00016622153266276704, "loss": 2.9325, "step": 111000, "training_step_in_ms": 1110.1254166848958 }, { "_prepare_inputs_in_ms": 4.183446723967791, "compute_loss_in_ms": 285.5392692387104, "epoch": 46.3, "learning_rate/full": 0.00016312936504190095, "loss": 2.9271, "step": 112000, "training_step_in_ms": 1116.0438286960125 }, { "_prepare_inputs_in_ms": 4.181461203843355, "compute_loss_in_ms": 285.49605195596814, "epoch": 46.71, "learning_rate/full": 0.00016004321335415234, "loss": 2.9338, "step": 113000, "training_step_in_ms": 1114.0362310223281 }, { "_prepare_inputs_in_ms": 4.20052033662796, "compute_loss_in_ms": 285.6174496598542, "epoch": 47.13, "learning_rate/full": 0.00015696694015230966, "loss": 2.93, "step": 114000, "training_step_in_ms": 1112.158472020179 }, { "_prepare_inputs_in_ms": 4.184404268860817, "compute_loss_in_ms": 285.52299703657627, "epoch": 47.54, "learning_rate/full": 0.00015390436604853944, "loss": 2.9265, "step": 115000, "training_step_in_ms": 1114.8844772167504 }, { "epoch": 47.54, "eval_visual_genome-densecap-local-densecap-test_loss": 2.985903263092041, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2781795787221218, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.8815, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.281, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 115000 }, { "_prepare_inputs_in_ms": 4.152440788542352, "compute_loss_in_ms": 285.35162526741624, "epoch": 47.95, "learning_rate/full": 0.00015085316535270307, "loss": 2.9288, "step": 116000, "training_step_in_ms": 1108.712267011404 }, { "_prepare_inputs_in_ms": 4.172631837427616, "compute_loss_in_ms": 285.6740382388234, "epoch": 48.37, "learning_rate/full": 0.0001478110551124508, "loss": 2.9217, "step": 117000, "training_step_in_ms": 1119.9308814108372 }, { "_prepare_inputs_in_ms": 4.173140484839678, "compute_loss_in_ms": 285.33917328342795, "epoch": 48.78, "learning_rate/full": 0.0001447878925453241, "loss": 2.9189, "step": 118000, "training_step_in_ms": 1114.4561827853322 }, { "_prepare_inputs_in_ms": 4.208178836852312, "compute_loss_in_ms": 285.7572955302894, "epoch": 49.19, "learning_rate/full": 0.00014177531694909012, "loss": 2.9234, "step": 119000, "training_step_in_ms": 1117.5116944983602 }, { "_prepare_inputs_in_ms": 4.171714887022972, "compute_loss_in_ms": 285.51325725764036, "epoch": 49.61, "learning_rate/full": 0.00013877411365635932, "loss": 2.919, "step": 120000, "training_step_in_ms": 1114.4923375099897 }, { "epoch": 49.61, "eval_visual_genome-densecap-local-densecap-test_loss": 2.984545946121216, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27571246372317004, "eval_visual_genome-densecap-local-densecap-test_runtime": 107.5626, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.438, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.232, "step": 120000 }, { "_prepare_inputs_in_ms": 4.169439662520478, "compute_loss_in_ms": 285.2081711217761, "epoch": 50.02, "learning_rate/full": 0.00013579102545242515, "loss": 2.9214, "step": 121000, "training_step_in_ms": 1117.0064120963216 }, { "_prepare_inputs_in_ms": 4.175419889390469, "compute_loss_in_ms": 285.44106700643897, "epoch": 50.43, "learning_rate/full": 0.00013282377985218108, "loss": 2.9123, "step": 122000, "training_step_in_ms": 1117.1209677942097 }, { "_prepare_inputs_in_ms": 4.1646773256361485, "compute_loss_in_ms": 285.5908838920295, "epoch": 50.85, "learning_rate/full": 0.0001298731089790791, "loss": 2.9181, "step": 123000, "training_step_in_ms": 1114.7672307156026 }, { "_prepare_inputs_in_ms": 4.172112949192524, "compute_loss_in_ms": 285.507780585438, "epoch": 51.26, "learning_rate/full": 0.0001269397408670054, "loss": 2.9124, "step": 124000, "training_step_in_ms": 1116.1798403412104 }, { "_prepare_inputs_in_ms": 4.171217355877161, "compute_loss_in_ms": 285.5308585166931, "epoch": 51.67, "learning_rate/full": 0.0001240214902928718, "loss": 2.9169, "step": 125000, "training_step_in_ms": 1119.0364625044167 }, { "epoch": 51.67, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9826271533966064, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27485379257600506, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.595, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.3, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 125000 }, { "_prepare_inputs_in_ms": 4.1942793857760545, "compute_loss_in_ms": 285.4048260115087, "epoch": 52.09, "learning_rate/full": 0.00012112491367260039, "loss": 2.9117, "step": 126000, "training_step_in_ms": 1113.5866565182805 }, { "_prepare_inputs_in_ms": 4.165726162493229, "compute_loss_in_ms": 285.52386473864317, "epoch": 52.5, "learning_rate/full": 0.0001182477982996471, "loss": 2.9123, "step": 127000, "training_step_in_ms": 1115.4936682023108 }, { "_prepare_inputs_in_ms": 4.165291707962751, "compute_loss_in_ms": 285.37697672098875, "epoch": 52.91, "learning_rate/full": 0.00011539085405917883, "loss": 2.9127, "step": 128000, "training_step_in_ms": 1112.6525225900114 }, { "_prepare_inputs_in_ms": 4.205962881445885, "compute_loss_in_ms": 285.6344051398337, "epoch": 53.33, "learning_rate/full": 0.00011255195764553374, "loss": 2.9072, "step": 129000, "training_step_in_ms": 1114.8041105866432 }, { "_prepare_inputs_in_ms": 4.192876800894737, "compute_loss_in_ms": 285.6524411961436, "epoch": 53.74, "learning_rate/full": 0.00010973748719012139, "loss": 2.9105, "step": 130000, "training_step_in_ms": 1113.7267719507217 }, { "epoch": 53.74, "eval_visual_genome-densecap-local-densecap-test_loss": 2.983597993850708, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2789962669075427, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.5326, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.304, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 130000 }, { "_prepare_inputs_in_ms": 4.207222261806813, "compute_loss_in_ms": 285.5676299482584, "epoch": 54.15, "learning_rate/full": 0.0001069452876591179, "loss": 2.9063, "step": 131000, "training_step_in_ms": 1114.3601090423763 }, { "_prepare_inputs_in_ms": 4.189547453075647, "compute_loss_in_ms": 285.45121479034424, "epoch": 54.57, "learning_rate/full": 0.00010417604798597693, "loss": 2.9068, "step": 132000, "training_step_in_ms": 1116.6341638937593 }, { "_prepare_inputs_in_ms": 4.203598700463772, "compute_loss_in_ms": 285.4171659834683, "epoch": 54.98, "learning_rate/full": 0.00010142771516637335, "loss": 2.8989, "step": 133000, "training_step_in_ms": 1110.624721519649 }, { "_prepare_inputs_in_ms": 4.217664018273354, "compute_loss_in_ms": 285.5546323284507, "epoch": 55.39, "learning_rate/full": 9.870646386303746e-05, "loss": 2.8974, "step": 134000, "training_step_in_ms": 1115.4996632412076 }, { "_prepare_inputs_in_ms": 4.18796281516552, "compute_loss_in_ms": 285.3805873543024, "epoch": 55.81, "learning_rate/full": 9.601020522405566e-05, "loss": 2.8997, "step": 135000, "training_step_in_ms": 1114.3139710351825 }, { "epoch": 55.81, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9829113483428955, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2781282773190371, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.4066, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.312, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.229, "step": 135000 }, { "_prepare_inputs_in_ms": 4.179593571802465, "compute_loss_in_ms": 285.6101936176419, "epoch": 56.22, "learning_rate/full": 9.333960451090202e-05, "loss": 2.9042, "step": 136000, "training_step_in_ms": 1112.9348441772163 }, { "_prepare_inputs_in_ms": 4.178862765431404, "compute_loss_in_ms": 285.4050006046891, "epoch": 56.63, "learning_rate/full": 9.069532065434167e-05, "loss": 2.8997, "step": 137000, "training_step_in_ms": 1110.1743725985289 }, { "_prepare_inputs_in_ms": 4.17331463098526, "compute_loss_in_ms": 285.60341618955135, "epoch": 57.05, "learning_rate/full": 8.807539988537217e-05, "loss": 2.8999, "step": 138000, "training_step_in_ms": 1112.455148395151 }, { "_prepare_inputs_in_ms": 4.164013888686895, "compute_loss_in_ms": 285.4794158451259, "epoch": 57.46, "learning_rate/full": 8.54857283641461e-05, "loss": 2.9008, "step": 139000, "training_step_in_ms": 1112.6597697511315 }, { "_prepare_inputs_in_ms": 4.174750838428736, "compute_loss_in_ms": 285.3338685967028, "epoch": 57.88, "learning_rate/full": 8.292176191253292e-05, "loss": 2.9003, "step": 140000, "training_step_in_ms": 1112.5756445713341 }, { "epoch": 57.88, "eval_visual_genome-densecap-local-densecap-test_loss": 2.983377456665039, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2765083682413393, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.2039, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.326, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.229, "step": 140000 }, { "_prepare_inputs_in_ms": 4.186901926267438, "compute_loss_in_ms": 285.5366085804999, "epoch": 58.29, "learning_rate/full": 8.038926097845864e-05, "loss": 2.89, "step": 141000, "training_step_in_ms": 1111.180388186127 }, { "_prepare_inputs_in_ms": 4.166560925543308, "compute_loss_in_ms": 285.2483623623848, "epoch": 58.7, "learning_rate/full": 7.788627220446403e-05, "loss": 2.8908, "step": 142000, "training_step_in_ms": 1112.5438826270401 }, { "_prepare_inputs_in_ms": 4.172076798975468, "compute_loss_in_ms": 285.31228306889534, "epoch": 59.12, "learning_rate/full": 7.541341316557602e-05, "loss": 2.888, "step": 143000, "training_step_in_ms": 1114.1774371489882 }, { "_prepare_inputs_in_ms": 4.1760097071528435, "compute_loss_in_ms": 285.51259553432465, "epoch": 59.53, "learning_rate/full": 7.29712940027603e-05, "loss": 2.8933, "step": 144000, "training_step_in_ms": 1113.300205629319 }, { "_prepare_inputs_in_ms": 4.171927604824305, "compute_loss_in_ms": 285.47950995340943, "epoch": 59.94, "learning_rate/full": 7.0560517272378e-05, "loss": 2.8946, "step": 145000, "training_step_in_ms": 1110.925380833447 }, { "epoch": 59.94, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9790754318237305, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27903548274273476, "eval_visual_genome-densecap-local-densecap-test_runtime": 108.6903, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.36, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.23, "step": 145000 }, { "_prepare_inputs_in_ms": 4.179818335829712, "compute_loss_in_ms": 285.67399540916085, "epoch": 60.36, "learning_rate/full": 6.818167779751427e-05, "loss": 2.8868, "step": 146000, "training_step_in_ms": 1113.526238951832 }, { "_prepare_inputs_in_ms": 4.174669615924358, "compute_loss_in_ms": 285.47526767477393, "epoch": 60.77, "learning_rate/full": 6.58353625212141e-05, "loss": 2.8908, "step": 147000, "training_step_in_ms": 1112.4517313353717 }, { "_prepare_inputs_in_ms": 4.206293076276779, "compute_loss_in_ms": 285.6568570397794, "epoch": 61.18, "learning_rate/full": 6.351985161010259e-05, "loss": 2.886, "step": 148000, "training_step_in_ms": 1114.374936837703 }, { "_prepare_inputs_in_ms": 4.173767436295748, "compute_loss_in_ms": 285.36785116791725, "epoch": 61.6, "learning_rate/full": 6.124034730854495e-05, "loss": 2.8877, "step": 149000, "training_step_in_ms": 1113.2941167131066 }, { "_prepare_inputs_in_ms": 4.186146479099989, "compute_loss_in_ms": 285.7034795098007, "epoch": 62.01, "learning_rate/full": 5.8995079874983696e-05, "loss": 2.887, "step": 150000, "training_step_in_ms": 1114.685032505542 }, { "epoch": 62.01, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9789364337921143, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2814554306931564, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.1484, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.263, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 150000 }, { "_prepare_inputs_in_ms": 4.176326023369301, "compute_loss_in_ms": 285.46767780929804, "epoch": 62.42, "learning_rate/full": 5.678240821954202e-05, "loss": 2.8806, "step": 151000, "training_step_in_ms": 1111.9945207312703 }, { "_prepare_inputs_in_ms": 4.179010454565287, "compute_loss_in_ms": 285.4651117064059, "epoch": 62.84, "learning_rate/full": 5.460730353825116e-05, "loss": 2.8834, "step": 152000, "training_step_in_ms": 1110.2052029296756 }, { "_prepare_inputs_in_ms": 4.173945639282465, "compute_loss_in_ms": 285.60662161558867, "epoch": 63.25, "learning_rate/full": 5.246594910646354e-05, "loss": 2.8816, "step": 153000, "training_step_in_ms": 1115.5096570029855 }, { "_prepare_inputs_in_ms": 4.187856215983629, "compute_loss_in_ms": 285.6514365822077, "epoch": 63.66, "learning_rate/full": 5.0363155892235236e-05, "loss": 2.8866, "step": 154000, "training_step_in_ms": 1113.550076983869 }, { "_prepare_inputs_in_ms": 4.191848460584879, "compute_loss_in_ms": 285.825974162668, "epoch": 64.08, "learning_rate/full": 4.8297283330226226e-05, "loss": 2.8812, "step": 155000, "training_step_in_ms": 1113.2165458351374 }, { "epoch": 64.08, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9803640842437744, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.28091860195000073, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.2234, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.258, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 155000 }, { "_prepare_inputs_in_ms": 4.170489263970677, "compute_loss_in_ms": 285.33177894353867, "epoch": 64.49, "learning_rate/full": 4.626682959161812e-05, "loss": 2.8769, "step": 156000, "training_step_in_ms": 1107.8080112151802 }, { "_prepare_inputs_in_ms": 4.165396176278591, "compute_loss_in_ms": 285.30143217742443, "epoch": 64.9, "learning_rate/full": 4.427635648454991e-05, "loss": 2.8775, "step": 157000, "training_step_in_ms": 1111.1020593941212 }, { "_prepare_inputs_in_ms": 4.1787227392196655, "compute_loss_in_ms": 285.6033191792667, "epoch": 65.32, "learning_rate/full": 4.2324305856376166e-05, "loss": 2.8824, "step": 158000, "training_step_in_ms": 1114.8409751541913 }, { "_prepare_inputs_in_ms": 4.168594349175692, "compute_loss_in_ms": 285.385168325156, "epoch": 65.73, "learning_rate/full": 4.040926393437829e-05, "loss": 2.8742, "step": 159000, "training_step_in_ms": 1112.1875176765025 }, { "_prepare_inputs_in_ms": 4.188820585608482, "compute_loss_in_ms": 285.74348379299045, "epoch": 66.14, "learning_rate/full": 3.853553323166454e-05, "loss": 2.874, "step": 160000, "training_step_in_ms": 1114.071101732552 }, { "epoch": 66.14, "eval_visual_genome-densecap-local-densecap-test_loss": 2.980635404586792, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2805308037735457, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.2483, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.323, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.229, "step": 160000 }, { "_prepare_inputs_in_ms": 4.17639887550982, "compute_loss_in_ms": 285.54739573970437, "epoch": 66.56, "learning_rate/full": 3.6703457126541777e-05, "loss": 2.8751, "step": 161000, "training_step_in_ms": 1101.9119679294527 }, { "_prepare_inputs_in_ms": 4.183506786823273, "compute_loss_in_ms": 285.5607514716685, "epoch": 66.97, "learning_rate/full": 3.4908041134979454e-05, "loss": 2.8781, "step": 162000, "training_step_in_ms": 1103.5643678978086 }, { "_prepare_inputs_in_ms": 4.188889868557453, "compute_loss_in_ms": 285.67521207407117, "epoch": 67.38, "learning_rate/full": 3.315517477040358e-05, "loss": 2.878, "step": 163000, "training_step_in_ms": 1105.4489219635725 }, { "_prepare_inputs_in_ms": 4.175573732703924, "compute_loss_in_ms": 285.59245705604553, "epoch": 67.8, "learning_rate/full": 3.14417822230312e-05, "loss": 2.8757, "step": 164000, "training_step_in_ms": 1105.2035297378898 }, { "_prepare_inputs_in_ms": 4.187327720224857, "compute_loss_in_ms": 285.88794915005565, "epoch": 68.21, "learning_rate/full": 2.9771712961539955e-05, "loss": 2.8763, "step": 165000, "training_step_in_ms": 1105.2709091752768 }, { "epoch": 68.21, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9800891876220703, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2802985242098701, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.8323, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.218, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.226, "step": 165000 }, { "_prepare_inputs_in_ms": 4.207263810605538, "compute_loss_in_ms": 285.7474652826786, "epoch": 68.62, "learning_rate/full": 2.8143644982694906e-05, "loss": 2.8761, "step": 166000, "training_step_in_ms": 1100.3973172418773 }, { "_prepare_inputs_in_ms": 4.210827711969614, "compute_loss_in_ms": 285.5911776944995, "epoch": 69.04, "learning_rate/full": 2.65579799879085e-05, "loss": 2.8751, "step": 167000, "training_step_in_ms": 1104.1183153651655 }, { "_prepare_inputs_in_ms": 4.198013573884964, "compute_loss_in_ms": 285.68624898046255, "epoch": 69.45, "learning_rate/full": 2.5015109216291467e-05, "loss": 2.8722, "step": 168000, "training_step_in_ms": 1105.6054084450006 }, { "_prepare_inputs_in_ms": 4.18689937889576, "compute_loss_in_ms": 285.61638662964106, "epoch": 69.86, "learning_rate/full": 2.3515413348120198e-05, "loss": 2.8743, "step": 169000, "training_step_in_ms": 1102.9215082861483 }, { "_prepare_inputs_in_ms": 4.210809834301472, "compute_loss_in_ms": 285.83876856043935, "epoch": 70.28, "learning_rate/full": 2.20592624109097e-05, "loss": 2.8696, "step": 170000, "training_step_in_ms": 1106.3744595497847 }, { "epoch": 70.28, "eval_visual_genome-densecap-local-densecap-test_loss": 2.979834794998169, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.28091535007381413, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.6944, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.293, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 170000 }, { "_prepare_inputs_in_ms": 4.173562210507509, "compute_loss_in_ms": 285.2328538559377, "epoch": 70.69, "learning_rate/full": 2.064562414115867e-05, "loss": 2.8723, "step": 171000, "training_step_in_ms": 1101.5736067220569 }, { "_prepare_inputs_in_ms": 4.184829708188772, "compute_loss_in_ms": 285.7893420346081, "epoch": 71.1, "learning_rate/full": 1.9277674551421355e-05, "loss": 2.8712, "step": 172000, "training_step_in_ms": 1104.9391337744892 }, { "_prepare_inputs_in_ms": 4.175479732453823, "compute_loss_in_ms": 285.58204352483153, "epoch": 71.52, "learning_rate/full": 1.7954315491282236e-05, "loss": 2.868, "step": 173000, "training_step_in_ms": 1106.567913543433 }, { "_prepare_inputs_in_ms": 4.216715902090073, "compute_loss_in_ms": 285.6606830134988, "epoch": 71.93, "learning_rate/full": 1.6674616367900976e-05, "loss": 2.8675, "step": 174000, "training_step_in_ms": 1104.7934159226716 }, { "_prepare_inputs_in_ms": 4.171092137694359, "compute_loss_in_ms": 285.4122787192464, "epoch": 72.34, "learning_rate/full": 1.5441452273561308e-05, "loss": 2.8671, "step": 175000, "training_step_in_ms": 1106.7299974374473 }, { "epoch": 72.34, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9793758392333984, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.281087276669587, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.0629, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.269, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 175000 }, { "_prepare_inputs_in_ms": 4.168345641072204, "compute_loss_in_ms": 285.7807895615697, "epoch": 72.76, "learning_rate/full": 1.4253825239264306e-05, "loss": 2.8714, "step": 176000, "training_step_in_ms": 1101.577396351844 }, { "_prepare_inputs_in_ms": 4.185015048831701, "compute_loss_in_ms": 285.48355446383357, "epoch": 73.17, "learning_rate/full": 1.3110908410358026e-05, "loss": 2.8674, "step": 177000, "training_step_in_ms": 1106.790641155094 }, { "_prepare_inputs_in_ms": 4.181742530316114, "compute_loss_in_ms": 285.46897569671273, "epoch": 73.58, "learning_rate/full": 1.2015269571172228e-05, "loss": 2.8685, "step": 178000, "training_step_in_ms": 1105.456206858158 }, { "_prepare_inputs_in_ms": 4.189217183738947, "compute_loss_in_ms": 285.7022790014744, "epoch": 74.0, "learning_rate/full": 1.0966013151343868e-05, "loss": 2.8703, "step": 179000, "training_step_in_ms": 1103.0243016816676 }, { "_prepare_inputs_in_ms": 4.1993721053004265, "compute_loss_in_ms": 285.9701578617096, "epoch": 74.41, "learning_rate/full": 9.962417871458617e-06, "loss": 2.8679, "step": 180000, "training_step_in_ms": 1108.1376051008701 }, { "epoch": 74.41, "eval_visual_genome-densecap-local-densecap-test_loss": 2.978816032409668, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.28102599122389305, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.271, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.255, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 180000 }, { "_prepare_inputs_in_ms": 4.160367134140759, "compute_loss_in_ms": 285.407042812556, "epoch": 74.82, "learning_rate/full": 9.006738502964407e-06, "loss": 2.8643, "step": 181000, "training_step_in_ms": 1101.3521456047893 }, { "_prepare_inputs_in_ms": 4.180663630366325, "compute_loss_in_ms": 285.55450112745166, "epoch": 75.24, "learning_rate/full": 8.098183863851083e-06, "loss": 2.8683, "step": 182000, "training_step_in_ms": 1107.5391217172146 }, { "_prepare_inputs_in_ms": 4.1743567287921906, "compute_loss_in_ms": 285.2670620009303, "epoch": 75.65, "learning_rate/full": 7.236978126380823e-06, "loss": 2.864, "step": 183000, "training_step_in_ms": 1103.5778979249299 }, { "_prepare_inputs_in_ms": 4.20133513212204, "compute_loss_in_ms": 285.7320618443191, "epoch": 76.06, "learning_rate/full": 6.424124390450504e-06, "loss": 2.8696, "step": 184000, "training_step_in_ms": 1102.3650901168585 }, { "_prepare_inputs_in_ms": 4.1793825179338455, "compute_loss_in_ms": 285.5250694230199, "epoch": 76.48, "learning_rate/full": 5.657451579824824e-06, "loss": 2.8645, "step": 185000, "training_step_in_ms": 1106.2330449260771 }, { "epoch": 76.48, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9790234565734863, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2804143185850342, "eval_visual_genome-densecap-local-densecap-test_runtime": 111.0093, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.207, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.225, "step": 185000 }, { "_prepare_inputs_in_ms": 4.18695215044952, "compute_loss_in_ms": 285.5290654525161, "epoch": 76.89, "learning_rate/full": 4.939520495279481e-06, "loss": 2.8657, "step": 186000, "training_step_in_ms": 1101.3268077746034 }, { "_prepare_inputs_in_ms": 4.185709021985531, "compute_loss_in_ms": 285.5161408223212, "epoch": 77.3, "learning_rate/full": 4.269717665299333e-06, "loss": 2.8633, "step": 187000, "training_step_in_ms": 1107.3937772586942 }, { "_prepare_inputs_in_ms": 4.219432931393385, "compute_loss_in_ms": 285.7696287557483, "epoch": 77.72, "learning_rate/full": 3.6476104696328672e-06, "loss": 2.8611, "step": 188000, "training_step_in_ms": 1103.4366898052394 }, { "_prepare_inputs_in_ms": 4.222444631159306, "compute_loss_in_ms": 285.7456459365785, "epoch": 78.13, "learning_rate/full": 3.0745965927555298e-06, "loss": 2.8682, "step": 189000, "training_step_in_ms": 1102.7803975529969 }, { "_prepare_inputs_in_ms": 4.181710965931416, "compute_loss_in_ms": 285.33873960748315, "epoch": 78.54, "learning_rate/full": 2.550171112510902e-06, "loss": 2.8619, "step": 190000, "training_step_in_ms": 1105.0700605846941 }, { "epoch": 78.54, "eval_visual_genome-densecap-local-densecap-test_loss": 2.979418992996216, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.28126194557201906, "eval_visual_genome-densecap-local-densecap-test_runtime": 110.0926, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.267, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 190000 }, { "_prepare_inputs_in_ms": 4.1674747299857255, "compute_loss_in_ms": 285.1683004386723, "epoch": 78.96, "learning_rate/full": 2.07446342303903e-06, "loss": 2.8623, "step": 191000, "training_step_in_ms": 1101.7088311165571 }, { "_prepare_inputs_in_ms": 4.192074902355671, "compute_loss_in_ms": 285.65734274312854, "epoch": 79.37, "learning_rate/full": 1.6475908980941423e-06, "loss": 2.8592, "step": 192000, "training_step_in_ms": 1110.4893043078482 }, { "_prepare_inputs_in_ms": 4.188501738011837, "compute_loss_in_ms": 285.3913672603667, "epoch": 79.79, "learning_rate/full": 1.2693051031663184e-06, "loss": 2.8693, "step": 193000, "training_step_in_ms": 1105.3064069263637 }, { "_prepare_inputs_in_ms": 4.1890876069664955, "compute_loss_in_ms": 285.6683066636324, "epoch": 80.2, "learning_rate/full": 9.404559306640304e-07, "loss": 2.8679, "step": 194000, "training_step_in_ms": 1106.7661010883749 }, { "_prepare_inputs_in_ms": 4.195614516735077, "compute_loss_in_ms": 285.7047406025231, "epoch": 80.61, "learning_rate/full": 6.607217220689466e-07, "loss": 2.8595, "step": 195000, "training_step_in_ms": 1110.2134825922549 }, { "epoch": 80.61, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9787235260009766, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2807572494534342, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.6903, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.293, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.228, "step": 195000 }, { "_prepare_inputs_in_ms": 4.209323071125077, "compute_loss_in_ms": 285.70444655045867, "epoch": 81.03, "learning_rate/full": 4.301714976112869e-07, "loss": 2.8627, "step": 196000, "training_step_in_ms": 1106.642473962158 }, { "_prepare_inputs_in_ms": 4.216882940381765, "compute_loss_in_ms": 285.90086993202567, "epoch": 81.44, "learning_rate/full": 2.4870533697582963e-07, "loss": 2.861, "step": 197000, "training_step_in_ms": 1110.1682490482926 }, { "_prepare_inputs_in_ms": 4.208073288202286, "compute_loss_in_ms": 285.9070298522711, "epoch": 81.85, "learning_rate/full": 1.167309390885718e-07, "loss": 2.8634, "step": 198000, "training_step_in_ms": 1105.8664784356952 }, { "_prepare_inputs_in_ms": 4.220877002924681, "compute_loss_in_ms": 285.8088936395943, "epoch": 82.27, "learning_rate/full": 3.407474692453949e-08, "loss": 2.8649, "step": 199000, "training_step_in_ms": 1108.864688232541 }, { "_prepare_inputs_in_ms": 4.200665093958378, "compute_loss_in_ms": 285.4954933747649, "epoch": 82.68, "learning_rate/full": 7.485261950046507e-10, "loss": 2.8661, "step": 200000, "training_step_in_ms": 1107.0144655555487 }, { "epoch": 82.68, "eval_visual_genome-densecap-local-densecap-test_loss": 2.9789507389068604, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.28079051577715114, "eval_visual_genome-densecap-local-densecap-test_runtime": 109.9761, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 7.274, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.227, "step": 200000 } ], "max_steps": 200000, "num_train_epochs": 83, "total_flos": 4.81380362914756e+23, "trial_name": null, "trial_params": null }