{ "global_steps": 27050, "loss": { "train": [ { "step": 50, "logs": { "loss": 1.2091, "epoch": 0.018484288354898338, "learning_rate": 1.0584432680980562e-05 } }, { "step": 100, "logs": { "loss": 1.1315, "epoch": 0.036968576709796676, "learning_rate": 1.2459822860720352e-05 } }, { "step": 150, "logs": { "loss": 1.1118, "epoch": 0.05545286506469501, "learning_rate": 1.355685579689696e-05 } }, { "step": 200, "logs": { "loss": 1.1091, "epoch": 0.07393715341959335, "learning_rate": 1.4335213053988223e-05 } }, { "step": 250, "logs": { "loss": 1.1063, "epoch": 0.09242144177449169, "learning_rate": 1.4938953847726847e-05 } }, { "step": 300, "logs": { "loss": 1.1012, "epoch": 0.11090573012939002, "learning_rate": 1.5432245994674192e-05 } }, { "step": 350, "logs": { "loss": 1.0844, "epoch": 0.12939001848428835, "learning_rate": 1.5849318562425815e-05 } }, { "step": 400, "logs": { "loss": 1.0911, "epoch": 0.1478743068391867, "learning_rate": 1.6210603254020138e-05 } }, { "step": 450, "logs": { "loss": 1.0816, "epoch": 0.16635859519408502, "learning_rate": 1.652927893686328e-05 } }, { "step": 500, "logs": { "loss": 1.0819, "epoch": 0.18484288354898337, "learning_rate": 1.6814344049111566e-05 } }, { "step": 550, "logs": { "loss": 1.0757, "epoch": 0.2033271719038817, "learning_rate": 1.70722168104602e-05 } }, { "step": 600, "logs": { "loss": 1.0706, "epoch": 0.22181146025878004, "learning_rate": 1.7307636196960783e-05 } }, { "step": 650, "logs": { "loss": 1.0698, "epoch": 0.24029574861367836, "learning_rate": 1.7524201039271304e-05 } }, { "step": 700, "logs": { "loss": 1.0632, "epoch": 0.2587800369685767, "learning_rate": 1.7724708765356604e-05 } }, { "step": 750, "logs": { "loss": 1.0601, "epoch": 0.27726432532347506, "learning_rate": 1.7911376992503148e-05 } }, { "step": 800, "logs": { "loss": 1.0582, "epoch": 0.2957486136783734, "learning_rate": 1.808599345743407e-05 } }, { "step": 850, "logs": { "loss": 1.0512, "epoch": 0.3142329020332717, "learning_rate": 1.825002041317456e-05 } }, { "step": 900, "logs": { "loss": 1.0544, "epoch": 0.33271719038817005, "learning_rate": 1.840466914065299e-05 } }, { "step": 950, "logs": { "loss": 1.043, "epoch": 0.3512014787430684, "learning_rate": 1.855095428760744e-05 } }, { "step": 1000, "logs": { "loss": 1.047, "epoch": 0.36968576709796674, "learning_rate": 1.8689734253201903e-05 } }, { "step": 1050, "logs": { "loss": 1.0408, "epoch": 0.38817005545286504, "learning_rate": 1.8821741709263542e-05 } }, { "step": 1100, "logs": { "loss": 1.0431, "epoch": 0.4066543438077634, "learning_rate": 1.89476070147965e-05 } }, { "step": 1150, "logs": { "loss": 1.0431, "epoch": 0.42513863216266173, "learning_rate": 1.9067876421445012e-05 } }, { "step": 1200, "logs": { "loss": 1.034, "epoch": 0.4436229205175601, "learning_rate": 1.9183026401502057e-05 } }, { "step": 1250, "logs": { "loss": 1.039, "epoch": 0.46210720887245843, "learning_rate": 1.9293475049105016e-05 } }, { "step": 1300, "logs": { "loss": 1.0304, "epoch": 0.4805914972273567, "learning_rate": 1.9399591243986016e-05 } }, { "step": 1350, "logs": { "loss": 1.0385, "epoch": 0.49907578558225507, "learning_rate": 1.950170208484624e-05 } }, { "step": 1400, "logs": { "loss": 1.027, "epoch": 0.5175600739371534, "learning_rate": 1.9600098970219974e-05 } }, { "step": 1450, "logs": { "loss": 1.0281, "epoch": 0.5360443622920518, "learning_rate": 1.9695042611797287e-05 } }, { "step": 1500, "logs": { "loss": 1.0282, "epoch": 0.5545286506469501, "learning_rate": 1.978676719749536e-05 } }, { "step": 1550, "logs": { "loss": 1.0186, "epoch": 0.5730129390018485, "learning_rate": 1.9875483871657987e-05 } }, { "step": 1600, "logs": { "loss": 1.0237, "epoch": 0.5914972273567468, "learning_rate": 1.9961383662539012e-05 } }, { "step": 1650, "logs": { "loss": 1.0176, "epoch": 0.609981515711645, "learning_rate": 1.9978762732528416e-05 } }, { "step": 1700, "logs": { "loss": 1.4539, "epoch": 0.6284658040665434, "learning_rate": 1.9939434459432887e-05 } }, { "step": 1750, "logs": { "loss": 1.2593, "epoch": 0.6469500924214417, "learning_rate": 1.990010618633736e-05 } }, { "step": 1800, "logs": { "loss": 1.5937, "epoch": 0.6654343807763401, "learning_rate": 1.986077791324183e-05 } }, { "step": 1850, "logs": { "loss": 1.0165, "epoch": 0.6839186691312384, "learning_rate": 1.9821449640146302e-05 } }, { "step": 1900, "logs": { "loss": 1.4354, "epoch": 0.7024029574861368, "learning_rate": 1.9782121367050776e-05 } }, { "step": 1950, "logs": { "loss": 1.021, "epoch": 0.7208872458410351, "learning_rate": 1.9742793093955247e-05 } }, { "step": 2000, "logs": { "loss": 1.0078, "epoch": 0.7393715341959335, "learning_rate": 1.9703464820859717e-05 } }, { "step": 2050, "logs": { "loss": 1.0057, "epoch": 0.7578558225508318, "learning_rate": 1.966413654776419e-05 } }, { "step": 2100, "logs": { "loss": 1.0001, "epoch": 0.7763401109057301, "learning_rate": 1.9624808274668662e-05 } }, { "step": 2150, "logs": { "loss": 1.006, "epoch": 0.7948243992606284, "learning_rate": 1.9585480001573133e-05 } }, { "step": 2200, "logs": { "loss": 1.0103, "epoch": 0.8133086876155268, "learning_rate": 1.9546151728477603e-05 } }, { "step": 2250, "logs": { "loss": 1.0046, "epoch": 0.8317929759704251, "learning_rate": 1.9506823455382077e-05 } }, { "step": 2300, "logs": { "loss": 0.9941, "epoch": 0.8502772643253235, "learning_rate": 1.9467495182286548e-05 } }, { "step": 2350, "logs": { "loss": 0.9963, "epoch": 0.8687615526802218, "learning_rate": 1.942816690919102e-05 } }, { "step": 2400, "logs": { "loss": 0.9926, "epoch": 0.8872458410351202, "learning_rate": 1.938883863609549e-05 } }, { "step": 2450, "logs": { "loss": 0.9918, "epoch": 0.9057301293900185, "learning_rate": 1.934951036299996e-05 } }, { "step": 2500, "logs": { "loss": 0.9899, "epoch": 0.9242144177449169, "learning_rate": 1.9310182089904434e-05 } }, { "step": 2550, "logs": { "loss": 0.9887, "epoch": 0.9426987060998152, "learning_rate": 1.9270853816808904e-05 } }, { "step": 2600, "logs": { "loss": 0.9942, "epoch": 0.9611829944547134, "learning_rate": 1.9231525543713375e-05 } }, { "step": 2650, "logs": { "loss": 0.9817, "epoch": 0.9796672828096118, "learning_rate": 1.919219727061785e-05 } }, { "step": 2700, "logs": { "loss": 0.9811, "epoch": 0.9981515711645101, "learning_rate": 1.915286899752232e-05 } }, { "step": 2750, "logs": { "loss": 0.8466, "epoch": 1.0166358595194085, "learning_rate": 1.911354072442679e-05 } }, { "step": 2800, "logs": { "loss": 0.8316, "epoch": 1.0351201478743068, "learning_rate": 1.9074212451331264e-05 } }, { "step": 2850, "logs": { "loss": 0.8363, "epoch": 1.0536044362292052, "learning_rate": 1.9034884178235735e-05 } }, { "step": 2900, "logs": { "loss": 0.8378, "epoch": 1.0720887245841035, "learning_rate": 1.8995555905140205e-05 } }, { "step": 2950, "logs": { "loss": 0.8386, "epoch": 1.0905730129390019, "learning_rate": 1.895622763204468e-05 } }, { "step": 3000, "logs": { "loss": 0.8465, "epoch": 1.1090573012939002, "learning_rate": 1.891689935894915e-05 } }, { "step": 3050, "logs": { "loss": 0.8375, "epoch": 1.1275415896487986, "learning_rate": 1.887757108585362e-05 } }, { "step": 3100, "logs": { "loss": 0.8379, "epoch": 1.146025878003697, "learning_rate": 1.8838242812758095e-05 } }, { "step": 3150, "logs": { "loss": 0.836, "epoch": 1.1645101663585953, "learning_rate": 1.8798914539662565e-05 } }, { "step": 3200, "logs": { "loss": 0.8411, "epoch": 1.1829944547134936, "learning_rate": 1.8759586266567036e-05 } }, { "step": 3250, "logs": { "loss": 0.8442, "epoch": 1.201478743068392, "learning_rate": 1.872025799347151e-05 } }, { "step": 3300, "logs": { "loss": 0.8397, "epoch": 1.21996303142329, "learning_rate": 1.868092972037598e-05 } }, { "step": 3350, "logs": { "loss": 0.8415, "epoch": 1.2384473197781884, "learning_rate": 1.864160144728045e-05 } }, { "step": 3400, "logs": { "loss": 0.8397, "epoch": 1.2569316081330868, "learning_rate": 1.8602273174184925e-05 } }, { "step": 3450, "logs": { "loss": 0.8396, "epoch": 1.2754158964879851, "learning_rate": 1.8562944901089396e-05 } }, { "step": 3500, "logs": { "loss": 0.8452, "epoch": 1.2939001848428835, "learning_rate": 1.8523616627993866e-05 } }, { "step": 3550, "logs": { "loss": 0.8362, "epoch": 1.3123844731977818, "learning_rate": 1.848428835489834e-05 } }, { "step": 3600, "logs": { "loss": 0.8396, "epoch": 1.3308687615526802, "learning_rate": 1.844496008180281e-05 } }, { "step": 3650, "logs": { "loss": 0.8334, "epoch": 1.3493530499075785, "learning_rate": 1.840563180870728e-05 } }, { "step": 3700, "logs": { "loss": 0.834, "epoch": 1.3678373382624769, "learning_rate": 1.8366303535611752e-05 } }, { "step": 3750, "logs": { "loss": 0.8333, "epoch": 1.3863216266173752, "learning_rate": 1.8326975262516223e-05 } }, { "step": 3800, "logs": { "loss": 0.8357, "epoch": 1.4048059149722736, "learning_rate": 1.8287646989420697e-05 } }, { "step": 3850, "logs": { "loss": 0.8374, "epoch": 1.423290203327172, "learning_rate": 1.8248318716325167e-05 } }, { "step": 3900, "logs": { "loss": 0.837, "epoch": 1.4417744916820703, "learning_rate": 1.8208990443229638e-05 } }, { "step": 3950, "logs": { "loss": 0.835, "epoch": 1.4602587800369686, "learning_rate": 1.816966217013411e-05 } }, { "step": 4000, "logs": { "loss": 0.8352, "epoch": 1.478743068391867, "learning_rate": 1.8130333897038583e-05 } }, { "step": 4050, "logs": { "loss": 0.8475, "epoch": 1.4972273567467653, "learning_rate": 1.8091005623943053e-05 } }, { "step": 4100, "logs": { "loss": 0.8339, "epoch": 1.5157116451016637, "learning_rate": 1.8051677350847524e-05 } }, { "step": 4150, "logs": { "loss": 0.8382, "epoch": 1.534195933456562, "learning_rate": 1.8012349077751998e-05 } }, { "step": 4200, "logs": { "loss": 0.8376, "epoch": 1.5526802218114601, "learning_rate": 1.797302080465647e-05 } }, { "step": 4250, "logs": { "loss": 0.8302, "epoch": 1.5711645101663585, "learning_rate": 1.793369253156094e-05 } }, { "step": 4300, "logs": { "loss": 0.8312, "epoch": 1.5896487985212568, "learning_rate": 1.7894364258465413e-05 } }, { "step": 4350, "logs": { "loss": 0.8361, "epoch": 1.6081330868761552, "learning_rate": 1.7855035985369884e-05 } }, { "step": 4400, "logs": { "loss": 0.8321, "epoch": 1.6266173752310535, "learning_rate": 1.7815707712274354e-05 } }, { "step": 4450, "logs": { "loss": 0.8374, "epoch": 1.645101663585952, "learning_rate": 1.777637943917883e-05 } }, { "step": 4500, "logs": { "loss": 0.8287, "epoch": 1.6635859519408502, "learning_rate": 1.77370511660833e-05 } }, { "step": 4550, "logs": { "loss": 0.8367, "epoch": 1.6820702402957486, "learning_rate": 1.769772289298777e-05 } }, { "step": 4600, "logs": { "loss": 0.8439, "epoch": 1.700554528650647, "learning_rate": 1.7658394619892244e-05 } }, { "step": 4650, "logs": { "loss": 0.829, "epoch": 1.7190388170055453, "learning_rate": 1.7619066346796714e-05 } }, { "step": 4700, "logs": { "loss": 0.8325, "epoch": 1.7375231053604436, "learning_rate": 1.7579738073701185e-05 } }, { "step": 4750, "logs": { "loss": 0.837, "epoch": 1.756007393715342, "learning_rate": 1.754040980060566e-05 } }, { "step": 4800, "logs": { "loss": 0.8371, "epoch": 1.7744916820702403, "learning_rate": 1.750108152751013e-05 } }, { "step": 4850, "logs": { "loss": 0.832, "epoch": 1.7929759704251387, "learning_rate": 1.74617532544146e-05 } }, { "step": 4900, "logs": { "loss": 0.8342, "epoch": 1.811460258780037, "learning_rate": 1.7422424981319074e-05 } }, { "step": 4950, "logs": { "loss": 0.8331, "epoch": 1.8299445471349354, "learning_rate": 1.7383096708223545e-05 } }, { "step": 5000, "logs": { "loss": 0.8234, "epoch": 1.8484288354898337, "learning_rate": 1.7343768435128015e-05 } }, { "step": 5050, "logs": { "loss": 0.8311, "epoch": 1.866913123844732, "learning_rate": 1.7304440162032486e-05 } }, { "step": 5100, "logs": { "loss": 0.8259, "epoch": 1.8853974121996304, "learning_rate": 1.726511188893696e-05 } }, { "step": 5150, "logs": { "loss": 0.8253, "epoch": 1.9038817005545285, "learning_rate": 1.722578361584143e-05 } }, { "step": 5200, "logs": { "loss": 0.8297, "epoch": 1.922365988909427, "learning_rate": 1.71864553427459e-05 } }, { "step": 5250, "logs": { "loss": 0.8264, "epoch": 1.9408502772643252, "learning_rate": 1.7147127069650372e-05 } }, { "step": 5300, "logs": { "loss": 0.8283, "epoch": 1.9593345656192236, "learning_rate": 1.7107798796554846e-05 } }, { "step": 5350, "logs": { "loss": 0.8262, "epoch": 1.977818853974122, "learning_rate": 1.7068470523459316e-05 } }, { "step": 5400, "logs": { "loss": 0.829, "epoch": 1.9963031423290203, "learning_rate": 1.7029142250363787e-05 } }, { "step": 5450, "logs": { "loss": 0.6969, "epoch": 2.014787430683919, "learning_rate": 1.6989813977268258e-05 } }, { "step": 5500, "logs": { "loss": 0.6715, "epoch": 2.033271719038817, "learning_rate": 1.695048570417273e-05 } }, { "step": 5550, "logs": { "loss": 0.6636, "epoch": 2.0517560073937156, "learning_rate": 1.6911157431077202e-05 } }, { "step": 5600, "logs": { "loss": 0.6649, "epoch": 2.0702402957486137, "learning_rate": 1.6871829157981673e-05 } }, { "step": 5650, "logs": { "loss": 0.665, "epoch": 2.088724584103512, "learning_rate": 1.6832500884886147e-05 } }, { "step": 5700, "logs": { "loss": 0.6746, "epoch": 2.1072088724584104, "learning_rate": 1.6793172611790617e-05 } }, { "step": 5750, "logs": { "loss": 0.6678, "epoch": 2.1256931608133085, "learning_rate": 1.6753844338695088e-05 } }, { "step": 5800, "logs": { "loss": 0.6739, "epoch": 2.144177449168207, "learning_rate": 1.6714516065599562e-05 } }, { "step": 5850, "logs": { "loss": 0.6666, "epoch": 2.162661737523105, "learning_rate": 1.6675187792504033e-05 } }, { "step": 5900, "logs": { "loss": 0.674, "epoch": 2.1811460258780038, "learning_rate": 1.6635859519408503e-05 } }, { "step": 5950, "logs": { "loss": 0.6737, "epoch": 2.199630314232902, "learning_rate": 1.6596531246312977e-05 } }, { "step": 6000, "logs": { "loss": 0.675, "epoch": 2.2181146025878005, "learning_rate": 1.6557202973217448e-05 } }, { "step": 6050, "logs": { "loss": 0.6743, "epoch": 2.2365988909426986, "learning_rate": 1.651787470012192e-05 } }, { "step": 6100, "logs": { "loss": 0.6718, "epoch": 2.255083179297597, "learning_rate": 1.647854642702639e-05 } }, { "step": 6150, "logs": { "loss": 0.6735, "epoch": 2.2735674676524953, "learning_rate": 1.6439218153930863e-05 } }, { "step": 6200, "logs": { "loss": 0.6798, "epoch": 2.292051756007394, "learning_rate": 1.6399889880835334e-05 } }, { "step": 6250, "logs": { "loss": 0.6768, "epoch": 2.310536044362292, "learning_rate": 1.6360561607739804e-05 } }, { "step": 6300, "logs": { "loss": 0.6796, "epoch": 2.3290203327171906, "learning_rate": 1.632123333464428e-05 } }, { "step": 6350, "logs": { "loss": 0.6813, "epoch": 2.3475046210720887, "learning_rate": 1.628190506154875e-05 } }, { "step": 6400, "logs": { "loss": 0.6774, "epoch": 2.3659889094269873, "learning_rate": 1.624257678845322e-05 } }, { "step": 6450, "logs": { "loss": 0.6745, "epoch": 2.3844731977818854, "learning_rate": 1.6203248515357694e-05 } }, { "step": 6500, "logs": { "loss": 0.6809, "epoch": 2.402957486136784, "learning_rate": 1.6163920242262164e-05 } }, { "step": 6550, "logs": { "loss": 0.6831, "epoch": 2.421441774491682, "learning_rate": 1.6124591969166635e-05 } }, { "step": 6600, "logs": { "loss": 0.6803, "epoch": 2.43992606284658, "learning_rate": 1.608526369607111e-05 } }, { "step": 6650, "logs": { "loss": 0.6791, "epoch": 2.4584103512014788, "learning_rate": 1.604593542297558e-05 } }, { "step": 6700, "logs": { "loss": 0.6812, "epoch": 2.476894639556377, "learning_rate": 1.600660714988005e-05 } }, { "step": 6750, "logs": { "loss": 0.6866, "epoch": 2.4953789279112755, "learning_rate": 1.596727887678452e-05 } }, { "step": 6800, "logs": { "loss": 0.6837, "epoch": 2.5138632162661736, "learning_rate": 1.5927950603688995e-05 } }, { "step": 6850, "logs": { "loss": 0.6814, "epoch": 2.532347504621072, "learning_rate": 1.5888622330593465e-05 } }, { "step": 6900, "logs": { "loss": 0.6845, "epoch": 2.5508317929759703, "learning_rate": 1.5849294057497936e-05 } }, { "step": 6950, "logs": { "loss": 0.6832, "epoch": 2.569316081330869, "learning_rate": 1.5809965784402407e-05 } }, { "step": 7000, "logs": { "loss": 0.6795, "epoch": 2.587800369685767, "learning_rate": 1.5770637511306877e-05 } }, { "step": 7050, "logs": { "loss": 0.679, "epoch": 2.6062846580406656, "learning_rate": 1.573130923821135e-05 } }, { "step": 7100, "logs": { "loss": 0.6851, "epoch": 2.6247689463955637, "learning_rate": 1.5691980965115822e-05 } }, { "step": 7150, "logs": { "loss": 0.692, "epoch": 2.6432532347504623, "learning_rate": 1.5652652692020292e-05 } }, { "step": 7200, "logs": { "loss": 0.6956, "epoch": 2.6617375231053604, "learning_rate": 1.5613324418924766e-05 } }, { "step": 7250, "logs": { "loss": 0.6883, "epoch": 2.680221811460259, "learning_rate": 1.5573996145829237e-05 } }, { "step": 7300, "logs": { "loss": 0.6806, "epoch": 2.698706099815157, "learning_rate": 1.5534667872733708e-05 } }, { "step": 7350, "logs": { "loss": 0.6832, "epoch": 2.7171903881700556, "learning_rate": 1.549533959963818e-05 } }, { "step": 7400, "logs": { "loss": 0.6871, "epoch": 2.7356746765249538, "learning_rate": 1.5456011326542652e-05 } }, { "step": 7450, "logs": { "loss": 0.6843, "epoch": 2.7541589648798523, "learning_rate": 1.5416683053447123e-05 } }, { "step": 7500, "logs": { "loss": 0.6869, "epoch": 2.7726432532347505, "learning_rate": 1.5377354780351597e-05 } }, { "step": 7550, "logs": { "loss": 0.689, "epoch": 2.7911275415896486, "learning_rate": 1.5338026507256067e-05 } }, { "step": 7600, "logs": { "loss": 0.6864, "epoch": 2.809611829944547, "learning_rate": 1.5298698234160538e-05 } }, { "step": 7650, "logs": { "loss": 0.6875, "epoch": 2.8280961182994453, "learning_rate": 1.5259369961065012e-05 } }, { "step": 7700, "logs": { "loss": 0.6844, "epoch": 2.846580406654344, "learning_rate": 1.5220041687969483e-05 } }, { "step": 7750, "logs": { "loss": 0.6916, "epoch": 2.865064695009242, "learning_rate": 1.5180713414873953e-05 } }, { "step": 7800, "logs": { "loss": 0.6849, "epoch": 2.8835489833641406, "learning_rate": 1.5141385141778426e-05 } }, { "step": 7850, "logs": { "loss": 0.6835, "epoch": 2.9020332717190387, "learning_rate": 1.5102056868682898e-05 } }, { "step": 7900, "logs": { "loss": 0.6866, "epoch": 2.9205175600739373, "learning_rate": 1.5062728595587369e-05 } }, { "step": 7950, "logs": { "loss": 0.6863, "epoch": 2.9390018484288354, "learning_rate": 1.502340032249184e-05 } }, { "step": 8000, "logs": { "loss": 0.6903, "epoch": 2.957486136783734, "learning_rate": 1.4984072049396311e-05 } }, { "step": 8050, "logs": { "loss": 0.686, "epoch": 2.975970425138632, "learning_rate": 1.4944743776300784e-05 } }, { "step": 8100, "logs": { "loss": 0.6909, "epoch": 2.9944547134935307, "learning_rate": 1.4905415503205256e-05 } }, { "step": 8150, "logs": { "loss": 0.5832, "epoch": 3.0129390018484288, "learning_rate": 1.4866087230109727e-05 } }, { "step": 8200, "logs": { "loss": 0.5314, "epoch": 3.0314232902033273, "learning_rate": 1.4826758957014197e-05 } }, { "step": 8250, "logs": { "loss": 0.5332, "epoch": 3.0499075785582255, "learning_rate": 1.4787430683918671e-05 } }, { "step": 8300, "logs": { "loss": 0.5359, "epoch": 3.068391866913124, "learning_rate": 1.4748102410823142e-05 } }, { "step": 8350, "logs": { "loss": 0.5398, "epoch": 3.086876155268022, "learning_rate": 1.4708774137727613e-05 } }, { "step": 8400, "logs": { "loss": 0.5433, "epoch": 3.1053604436229203, "learning_rate": 1.4669445864632087e-05 } }, { "step": 8450, "logs": { "loss": 0.5368, "epoch": 3.123844731977819, "learning_rate": 1.4630117591536557e-05 } }, { "step": 8500, "logs": { "loss": 0.5419, "epoch": 3.142329020332717, "learning_rate": 1.4590789318441028e-05 } }, { "step": 8550, "logs": { "loss": 0.5398, "epoch": 3.1608133086876156, "learning_rate": 1.45514610453455e-05 } }, { "step": 8600, "logs": { "loss": 0.5442, "epoch": 3.1792975970425137, "learning_rate": 1.4512132772249972e-05 } }, { "step": 8650, "logs": { "loss": 0.544, "epoch": 3.1977818853974123, "learning_rate": 1.4472804499154443e-05 } }, { "step": 8700, "logs": { "loss": 0.5455, "epoch": 3.2162661737523104, "learning_rate": 1.4433476226058915e-05 } }, { "step": 8750, "logs": { "loss": 0.548, "epoch": 3.234750462107209, "learning_rate": 1.4394147952963386e-05 } }, { "step": 8800, "logs": { "loss": 0.5453, "epoch": 3.253234750462107, "learning_rate": 1.4354819679867858e-05 } }, { "step": 8850, "logs": { "loss": 0.5416, "epoch": 3.2717190388170057, "learning_rate": 1.431549140677233e-05 } }, { "step": 8900, "logs": { "loss": 0.5542, "epoch": 3.290203327171904, "learning_rate": 1.4276163133676801e-05 } }, { "step": 8950, "logs": { "loss": 0.5469, "epoch": 3.3086876155268024, "learning_rate": 1.4236834860581272e-05 } }, { "step": 9000, "logs": { "loss": 0.5545, "epoch": 3.3271719038817005, "learning_rate": 1.4197506587485746e-05 } }, { "step": 9050, "logs": { "loss": 0.5538, "epoch": 3.345656192236599, "learning_rate": 1.4158178314390216e-05 } }, { "step": 9100, "logs": { "loss": 0.5504, "epoch": 3.364140480591497, "learning_rate": 1.4118850041294687e-05 } }, { "step": 9150, "logs": { "loss": 0.5511, "epoch": 3.3826247689463957, "learning_rate": 1.4079521768199161e-05 } }, { "step": 9200, "logs": { "loss": 0.554, "epoch": 3.401109057301294, "learning_rate": 1.4040193495103632e-05 } }, { "step": 9250, "logs": { "loss": 0.5541, "epoch": 3.4195933456561924, "learning_rate": 1.4000865222008102e-05 } }, { "step": 9300, "logs": { "loss": 0.5502, "epoch": 3.4380776340110906, "learning_rate": 1.3961536948912575e-05 } }, { "step": 9350, "logs": { "loss": 0.5513, "epoch": 3.4565619223659887, "learning_rate": 1.3922208675817047e-05 } }, { "step": 9400, "logs": { "loss": 0.5579, "epoch": 3.4750462107208873, "learning_rate": 1.3882880402721517e-05 } }, { "step": 9450, "logs": { "loss": 0.5636, "epoch": 3.4935304990757854, "learning_rate": 1.384355212962599e-05 } }, { "step": 9500, "logs": { "loss": 0.5617, "epoch": 3.512014787430684, "learning_rate": 1.380422385653046e-05 } }, { "step": 9550, "logs": { "loss": 0.5549, "epoch": 3.530499075785582, "learning_rate": 1.3764895583434933e-05 } }, { "step": 9600, "logs": { "loss": 0.5599, "epoch": 3.5489833641404807, "learning_rate": 1.3725567310339405e-05 } }, { "step": 9650, "logs": { "loss": 0.5565, "epoch": 3.567467652495379, "learning_rate": 1.3686239037243876e-05 } }, { "step": 9700, "logs": { "loss": 0.5565, "epoch": 3.5859519408502774, "learning_rate": 1.3646910764148346e-05 } }, { "step": 9750, "logs": { "loss": 0.5558, "epoch": 3.6044362292051755, "learning_rate": 1.360758249105282e-05 } }, { "step": 9800, "logs": { "loss": 0.5599, "epoch": 3.622920517560074, "learning_rate": 1.356825421795729e-05 } }, { "step": 9850, "logs": { "loss": 0.561, "epoch": 3.641404805914972, "learning_rate": 1.3528925944861761e-05 } }, { "step": 9900, "logs": { "loss": 0.5596, "epoch": 3.6598890942698707, "learning_rate": 1.3489597671766235e-05 } }, { "step": 9950, "logs": { "loss": 0.5596, "epoch": 3.678373382624769, "learning_rate": 1.3450269398670706e-05 } }, { "step": 10000, "logs": { "loss": 0.5579, "epoch": 3.6968576709796674, "learning_rate": 1.3410941125575177e-05 } }, { "step": 10050, "logs": { "loss": 0.5611, "epoch": 3.7153419593345656, "learning_rate": 1.3371612852479649e-05 } }, { "step": 10100, "logs": { "loss": 0.5627, "epoch": 3.733826247689464, "learning_rate": 1.3332284579384121e-05 } }, { "step": 10150, "logs": { "loss": 0.5613, "epoch": 3.7523105360443623, "learning_rate": 1.3292956306288592e-05 } }, { "step": 10200, "logs": { "loss": 0.5607, "epoch": 3.770794824399261, "learning_rate": 1.3253628033193064e-05 } }, { "step": 10250, "logs": { "loss": 0.5651, "epoch": 3.789279112754159, "learning_rate": 1.3214299760097535e-05 } }, { "step": 10300, "logs": { "loss": 0.5604, "epoch": 3.807763401109057, "learning_rate": 1.3174971487002005e-05 } }, { "step": 10350, "logs": { "loss": 0.5676, "epoch": 3.8262476894639557, "learning_rate": 1.313564321390648e-05 } }, { "step": 10400, "logs": { "loss": 0.5601, "epoch": 3.844731977818854, "learning_rate": 1.309631494081095e-05 } }, { "step": 10450, "logs": { "loss": 0.5645, "epoch": 3.8632162661737524, "learning_rate": 1.305698666771542e-05 } }, { "step": 10500, "logs": { "loss": 0.5653, "epoch": 3.8817005545286505, "learning_rate": 1.3017658394619895e-05 } }, { "step": 10550, "logs": { "loss": 0.5618, "epoch": 3.900184842883549, "learning_rate": 1.2978330121524365e-05 } }, { "step": 10600, "logs": { "loss": 0.5624, "epoch": 3.918669131238447, "learning_rate": 1.2939001848428836e-05 } }, { "step": 10650, "logs": { "loss": 0.5621, "epoch": 3.9371534195933457, "learning_rate": 1.289967357533331e-05 } }, { "step": 10700, "logs": { "loss": 0.5633, "epoch": 3.955637707948244, "learning_rate": 1.286034530223778e-05 } }, { "step": 10750, "logs": { "loss": 0.5645, "epoch": 3.9741219963031424, "learning_rate": 1.2821017029142251e-05 } }, { "step": 10800, "logs": { "loss": 0.5675, "epoch": 3.9926062846580406, "learning_rate": 1.2781688756046723e-05 } }, { "step": 10850, "logs": { "loss": 0.4943, "epoch": 4.011090573012939, "learning_rate": 1.2742360482951194e-05 } }, { "step": 10900, "logs": { "loss": 0.4282, "epoch": 4.029574861367838, "learning_rate": 1.2703032209855666e-05 } }, { "step": 10950, "logs": { "loss": 0.4285, "epoch": 4.048059149722736, "learning_rate": 1.2663703936760139e-05 } }, { "step": 11000, "logs": { "loss": 0.4307, "epoch": 4.066543438077634, "learning_rate": 1.262437566366461e-05 } }, { "step": 11050, "logs": { "loss": 0.4372, "epoch": 4.085027726432532, "learning_rate": 1.258504739056908e-05 } }, { "step": 11100, "logs": { "loss": 0.4377, "epoch": 4.103512014787431, "learning_rate": 1.2545719117473554e-05 } }, { "step": 11150, "logs": { "loss": 0.4296, "epoch": 4.121996303142329, "learning_rate": 1.2506390844378025e-05 } }, { "step": 11200, "logs": { "loss": 0.4358, "epoch": 4.140480591497227, "learning_rate": 1.2467062571282495e-05 } }, { "step": 11250, "logs": { "loss": 0.4383, "epoch": 4.1589648798521255, "learning_rate": 1.2427734298186969e-05 } }, { "step": 11300, "logs": { "loss": 0.4355, "epoch": 4.177449168207024, "learning_rate": 1.238840602509144e-05 } }, { "step": 11350, "logs": { "loss": 0.44, "epoch": 4.195933456561923, "learning_rate": 1.234907775199591e-05 } }, { "step": 11400, "logs": { "loss": 0.4393, "epoch": 4.214417744916821, "learning_rate": 1.2309749478900384e-05 } }, { "step": 11450, "logs": { "loss": 0.4427, "epoch": 4.232902033271719, "learning_rate": 1.2270421205804855e-05 } }, { "step": 11500, "logs": { "loss": 0.4399, "epoch": 4.251386321626617, "learning_rate": 1.2231092932709326e-05 } }, { "step": 11550, "logs": { "loss": 0.4401, "epoch": 4.269870609981516, "learning_rate": 1.2191764659613798e-05 } }, { "step": 11600, "logs": { "loss": 0.4446, "epoch": 4.288354898336414, "learning_rate": 1.2152436386518269e-05 } }, { "step": 11650, "logs": { "loss": 0.4436, "epoch": 4.306839186691312, "learning_rate": 1.211310811342274e-05 } }, { "step": 11700, "logs": { "loss": 0.4478, "epoch": 4.32532347504621, "learning_rate": 1.2073779840327213e-05 } }, { "step": 11750, "logs": { "loss": 0.447, "epoch": 4.343807763401109, "learning_rate": 1.2034451567231684e-05 } }, { "step": 11800, "logs": { "loss": 0.4505, "epoch": 4.3622920517560075, "learning_rate": 1.1995123294136154e-05 } }, { "step": 11850, "logs": { "loss": 0.4461, "epoch": 4.380776340110906, "learning_rate": 1.1955795021040628e-05 } }, { "step": 11900, "logs": { "loss": 0.4511, "epoch": 4.399260628465804, "learning_rate": 1.1916466747945099e-05 } }, { "step": 11950, "logs": { "loss": 0.4481, "epoch": 4.417744916820703, "learning_rate": 1.187713847484957e-05 } }, { "step": 12000, "logs": { "loss": 0.4457, "epoch": 4.436229205175601, "learning_rate": 1.1837810201754044e-05 } }, { "step": 12050, "logs": { "loss": 0.4491, "epoch": 4.454713493530499, "learning_rate": 1.1798481928658514e-05 } }, { "step": 12100, "logs": { "loss": 0.453, "epoch": 4.473197781885397, "learning_rate": 1.1759153655562985e-05 } }, { "step": 12150, "logs": { "loss": 0.4557, "epoch": 4.491682070240295, "learning_rate": 1.1719825382467455e-05 } }, { "step": 12200, "logs": { "loss": 0.4588, "epoch": 4.510166358595194, "learning_rate": 1.168049710937193e-05 } }, { "step": 12250, "logs": { "loss": 0.4478, "epoch": 4.5286506469500925, "learning_rate": 1.16411688362764e-05 } }, { "step": 12300, "logs": { "loss": 0.4558, "epoch": 4.547134935304991, "learning_rate": 1.160184056318087e-05 } }, { "step": 12350, "logs": { "loss": 0.453, "epoch": 4.565619223659889, "learning_rate": 1.1562512290085343e-05 } }, { "step": 12400, "logs": { "loss": 0.4566, "epoch": 4.584103512014788, "learning_rate": 1.1523184016989815e-05 } }, { "step": 12450, "logs": { "loss": 0.4512, "epoch": 4.602587800369686, "learning_rate": 1.1483855743894286e-05 } }, { "step": 12500, "logs": { "loss": 0.4537, "epoch": 4.621072088724584, "learning_rate": 1.1444527470798758e-05 } }, { "step": 12550, "logs": { "loss": 0.4596, "epoch": 4.639556377079482, "learning_rate": 1.1405199197703229e-05 } }, { "step": 12600, "logs": { "loss": 0.4544, "epoch": 4.658040665434381, "learning_rate": 1.1365870924607701e-05 } }, { "step": 12650, "logs": { "loss": 0.4552, "epoch": 4.676524953789279, "learning_rate": 1.1326542651512173e-05 } }, { "step": 12700, "logs": { "loss": 0.4561, "epoch": 4.695009242144177, "learning_rate": 1.1287214378416644e-05 } }, { "step": 12750, "logs": { "loss": 0.456, "epoch": 4.7134935304990755, "learning_rate": 1.1247886105321115e-05 } }, { "step": 12800, "logs": { "loss": 0.455, "epoch": 4.7319778188539745, "learning_rate": 1.1208557832225589e-05 } }, { "step": 12850, "logs": { "loss": 0.4579, "epoch": 4.750462107208873, "learning_rate": 1.116922955913006e-05 } }, { "step": 12900, "logs": { "loss": 0.4569, "epoch": 4.768946395563771, "learning_rate": 1.112990128603453e-05 } }, { "step": 12950, "logs": { "loss": 0.459, "epoch": 4.787430683918669, "learning_rate": 1.1090573012939004e-05 } }, { "step": 13000, "logs": { "loss": 0.456, "epoch": 4.805914972273568, "learning_rate": 1.1051244739843475e-05 } }, { "step": 13050, "logs": { "loss": 0.4605, "epoch": 4.824399260628466, "learning_rate": 1.1011916466747945e-05 } }, { "step": 13100, "logs": { "loss": 0.4565, "epoch": 4.842883548983364, "learning_rate": 1.0972588193652417e-05 } }, { "step": 13150, "logs": { "loss": 0.4606, "epoch": 4.861367837338262, "learning_rate": 1.093325992055689e-05 } }, { "step": 13200, "logs": { "loss": 0.4586, "epoch": 4.87985212569316, "learning_rate": 1.089393164746136e-05 } }, { "step": 13250, "logs": { "loss": 0.4605, "epoch": 4.898336414048059, "learning_rate": 1.0854603374365833e-05 } }, { "step": 13300, "logs": { "loss": 0.4565, "epoch": 4.9168207024029575, "learning_rate": 1.0815275101270303e-05 } }, { "step": 13350, "logs": { "loss": 0.4585, "epoch": 4.935304990757856, "learning_rate": 1.0775946828174776e-05 } }, { "step": 13400, "logs": { "loss": 0.4588, "epoch": 4.953789279112754, "learning_rate": 1.0736618555079248e-05 } }, { "step": 13450, "logs": { "loss": 0.4639, "epoch": 4.972273567467653, "learning_rate": 1.0697290281983718e-05 } }, { "step": 13500, "logs": { "loss": 0.4666, "epoch": 4.990757855822551, "learning_rate": 1.0657962008888189e-05 } }, { "step": 13550, "logs": { "loss": 0.4109, "epoch": 5.009242144177449, "learning_rate": 1.0618633735792663e-05 } }, { "step": 13600, "logs": { "loss": 0.3538, "epoch": 5.027726432532347, "learning_rate": 1.0579305462697134e-05 } }, { "step": 13650, "logs": { "loss": 0.346, "epoch": 5.046210720887246, "learning_rate": 1.0539977189601604e-05 } }, { "step": 13700, "logs": { "loss": 0.3483, "epoch": 5.064695009242144, "learning_rate": 1.0500648916506078e-05 } }, { "step": 13750, "logs": { "loss": 0.3548, "epoch": 5.0831792975970425, "learning_rate": 1.0461320643410549e-05 } }, { "step": 13800, "logs": { "loss": 0.3567, "epoch": 5.101663585951941, "learning_rate": 1.042199237031502e-05 } }, { "step": 13850, "logs": { "loss": 0.3525, "epoch": 5.12014787430684, "learning_rate": 1.0382664097219492e-05 } }, { "step": 13900, "logs": { "loss": 0.3563, "epoch": 5.138632162661738, "learning_rate": 1.0343335824123964e-05 } }, { "step": 13950, "logs": { "loss": 0.3606, "epoch": 5.157116451016636, "learning_rate": 1.0304007551028435e-05 } }, { "step": 14000, "logs": { "loss": 0.3585, "epoch": 5.175600739371534, "learning_rate": 1.0264679277932907e-05 } }, { "step": 14050, "logs": { "loss": 0.3547, "epoch": 5.194085027726432, "learning_rate": 1.0225351004837378e-05 } }, { "step": 14100, "logs": { "loss": 0.359, "epoch": 5.212569316081331, "learning_rate": 1.018602273174185e-05 } }, { "step": 14150, "logs": { "loss": 0.3616, "epoch": 5.231053604436229, "learning_rate": 1.0146694458646322e-05 } }, { "step": 14200, "logs": { "loss": 0.3602, "epoch": 5.249537892791127, "learning_rate": 1.0107366185550793e-05 } }, { "step": 14250, "logs": { "loss": 0.3607, "epoch": 5.2680221811460255, "learning_rate": 1.0068037912455264e-05 } }, { "step": 14300, "logs": { "loss": 0.3642, "epoch": 5.2865064695009245, "learning_rate": 1.0028709639359738e-05 } }, { "step": 14350, "logs": { "loss": 0.3616, "epoch": 5.304990757855823, "learning_rate": 9.989381366264208e-06 } }, { "step": 14400, "logs": { "loss": 0.364, "epoch": 5.323475046210721, "learning_rate": 9.95005309316868e-06 } }, { "step": 14450, "logs": { "loss": 0.3656, "epoch": 5.341959334565619, "learning_rate": 9.910724820073151e-06 } }, { "step": 14500, "logs": { "loss": 0.3613, "epoch": 5.360443622920518, "learning_rate": 9.871396546977623e-06 } }, { "step": 14550, "logs": { "loss": 0.3655, "epoch": 5.378927911275416, "learning_rate": 9.832068273882096e-06 } }, { "step": 14600, "logs": { "loss": 0.3677, "epoch": 5.397412199630314, "learning_rate": 9.792740000786566e-06 } }, { "step": 14650, "logs": { "loss": 0.3678, "epoch": 5.415896487985212, "learning_rate": 9.753411727691039e-06 } }, { "step": 14700, "logs": { "loss": 0.364, "epoch": 5.434380776340111, "learning_rate": 9.71408345459551e-06 } }, { "step": 14750, "logs": { "loss": 0.3654, "epoch": 5.452865064695009, "learning_rate": 9.67475518149998e-06 } }, { "step": 14800, "logs": { "loss": 0.3671, "epoch": 5.4713493530499075, "learning_rate": 9.635426908404452e-06 } }, { "step": 14850, "logs": { "loss": 0.3724, "epoch": 5.489833641404806, "learning_rate": 9.596098635308924e-06 } }, { "step": 14900, "logs": { "loss": 1.4537, "epoch": 5.508317929759705, "learning_rate": 9.556770362213395e-06 } }, { "step": 14950, "logs": { "loss": 0.3685, "epoch": 5.526802218114603, "learning_rate": 9.517442089117867e-06 } }, { "step": 15000, "logs": { "loss": 0.3688, "epoch": 5.545286506469501, "learning_rate": 9.47811381602234e-06 } }, { "step": 15050, "logs": { "loss": 0.3726, "epoch": 5.563770794824399, "learning_rate": 9.43878554292681e-06 } }, { "step": 15100, "logs": { "loss": 0.3718, "epoch": 5.582255083179297, "learning_rate": 9.399457269831283e-06 } }, { "step": 15150, "logs": { "loss": 0.3691, "epoch": 5.600739371534196, "learning_rate": 9.360128996735755e-06 } }, { "step": 15200, "logs": { "loss": 0.3684, "epoch": 5.619223659889094, "learning_rate": 9.320800723640226e-06 } }, { "step": 15250, "logs": { "loss": 0.3747, "epoch": 5.6377079482439925, "learning_rate": 9.281472450544698e-06 } }, { "step": 15300, "logs": { "loss": 0.3727, "epoch": 5.656192236598891, "learning_rate": 9.24214417744917e-06 } }, { "step": 15350, "logs": { "loss": 0.3736, "epoch": 5.67467652495379, "learning_rate": 9.20281590435364e-06 } }, { "step": 15400, "logs": { "loss": 0.3725, "epoch": 5.693160813308688, "learning_rate": 9.163487631258111e-06 } }, { "step": 15450, "logs": { "loss": 0.3711, "epoch": 5.711645101663586, "learning_rate": 9.124159358162584e-06 } }, { "step": 15500, "logs": { "loss": 0.3705, "epoch": 5.730129390018484, "learning_rate": 9.084831085067054e-06 } }, { "step": 15550, "logs": { "loss": 0.3698, "epoch": 5.748613678373383, "learning_rate": 9.045502811971527e-06 } }, { "step": 15600, "logs": { "loss": 0.3725, "epoch": 5.767097966728281, "learning_rate": 9.006174538875999e-06 } }, { "step": 15650, "logs": { "loss": 0.3767, "epoch": 5.785582255083179, "learning_rate": 8.96684626578047e-06 } }, { "step": 15700, "logs": { "loss": 0.3696, "epoch": 5.804066543438077, "learning_rate": 8.927517992684942e-06 } }, { "step": 15750, "logs": { "loss": 0.3797, "epoch": 5.822550831792976, "learning_rate": 8.888189719589414e-06 } }, { "step": 15800, "logs": { "loss": 0.371, "epoch": 5.8410351201478745, "learning_rate": 8.848861446493885e-06 } }, { "step": 15850, "logs": { "loss": 0.3769, "epoch": 5.859519408502773, "learning_rate": 8.809533173398357e-06 } }, { "step": 15900, "logs": { "loss": 0.3731, "epoch": 5.878003696857671, "learning_rate": 8.77020490030283e-06 } }, { "step": 15950, "logs": { "loss": 0.3769, "epoch": 5.896487985212569, "learning_rate": 8.7308766272073e-06 } }, { "step": 16000, "logs": { "loss": 0.3711, "epoch": 5.914972273567468, "learning_rate": 8.691548354111772e-06 } }, { "step": 16050, "logs": { "loss": 0.3752, "epoch": 5.933456561922366, "learning_rate": 8.652220081016243e-06 } }, { "step": 16100, "logs": { "loss": 0.3697, "epoch": 5.951940850277264, "learning_rate": 8.612891807920715e-06 } }, { "step": 16150, "logs": { "loss": 0.3751, "epoch": 5.970425138632162, "learning_rate": 8.573563534825186e-06 } }, { "step": 16200, "logs": { "loss": 0.3791, "epoch": 5.988909426987061, "learning_rate": 8.534235261729658e-06 } }, { "step": 16250, "logs": { "loss": 0.3443, "epoch": 6.007393715341959, "learning_rate": 8.494906988634129e-06 } }, { "step": 16300, "logs": { "loss": 0.2903, "epoch": 6.0258780036968576, "learning_rate": 8.455578715538601e-06 } }, { "step": 16350, "logs": { "loss": 0.2906, "epoch": 6.044362292051756, "learning_rate": 8.416250442443073e-06 } }, { "step": 16400, "logs": { "loss": 0.2884, "epoch": 6.062846580406655, "learning_rate": 8.376922169347544e-06 } }, { "step": 16450, "logs": { "loss": 0.2913, "epoch": 6.081330868761553, "learning_rate": 8.337593896252016e-06 } }, { "step": 16500, "logs": { "loss": 0.2964, "epoch": 6.099815157116451, "learning_rate": 8.298265623156489e-06 } }, { "step": 16550, "logs": { "loss": 0.2877, "epoch": 6.118299445471349, "learning_rate": 8.25893735006096e-06 } }, { "step": 16600, "logs": { "loss": 0.2957, "epoch": 6.136783733826248, "learning_rate": 8.219609076965432e-06 } }, { "step": 16650, "logs": { "loss": 0.2974, "epoch": 6.155268022181146, "learning_rate": 8.180280803869902e-06 } }, { "step": 16700, "logs": { "loss": 0.295, "epoch": 6.173752310536044, "learning_rate": 8.140952530774374e-06 } }, { "step": 16750, "logs": { "loss": 0.2947, "epoch": 6.1922365988909425, "learning_rate": 8.101624257678847e-06 } }, { "step": 16800, "logs": { "loss": 0.2957, "epoch": 6.210720887245841, "learning_rate": 8.062295984583317e-06 } }, { "step": 16850, "logs": { "loss": 0.3001, "epoch": 6.22920517560074, "learning_rate": 8.02296771148779e-06 } }, { "step": 16900, "logs": { "loss": 0.2958, "epoch": 6.247689463955638, "learning_rate": 7.98363943839226e-06 } }, { "step": 16950, "logs": { "loss": 0.2956, "epoch": 6.266173752310536, "learning_rate": 7.944311165296733e-06 } }, { "step": 17000, "logs": { "loss": 0.3, "epoch": 6.284658040665434, "learning_rate": 7.904982892201203e-06 } }, { "step": 17050, "logs": { "loss": 0.3, "epoch": 6.303142329020333, "learning_rate": 7.865654619105676e-06 } }, { "step": 17100, "logs": { "loss": 0.3003, "epoch": 6.321626617375231, "learning_rate": 7.826326346010146e-06 } }, { "step": 17150, "logs": { "loss": 0.3029, "epoch": 6.340110905730129, "learning_rate": 7.786998072914618e-06 } }, { "step": 17200, "logs": { "loss": 0.301, "epoch": 6.358595194085027, "learning_rate": 7.74766979981909e-06 } }, { "step": 17250, "logs": { "loss": 0.297, "epoch": 6.377079482439926, "learning_rate": 7.708341526723561e-06 } }, { "step": 17300, "logs": { "loss": 0.2993, "epoch": 6.3955637707948245, "learning_rate": 7.669013253628034e-06 } }, { "step": 17350, "logs": { "loss": 0.3035, "epoch": 6.414048059149723, "learning_rate": 7.629684980532506e-06 } }, { "step": 17400, "logs": { "loss": 0.2988, "epoch": 6.432532347504621, "learning_rate": 7.590356707436977e-06 } }, { "step": 17450, "logs": { "loss": 0.3001, "epoch": 6.45101663585952, "learning_rate": 7.551028434341449e-06 } }, { "step": 17500, "logs": { "loss": 0.3024, "epoch": 6.469500924214418, "learning_rate": 7.51170016124592e-06 } }, { "step": 17550, "logs": { "loss": 0.3053, "epoch": 6.487985212569316, "learning_rate": 7.472371888150392e-06 } }, { "step": 17600, "logs": { "loss": 0.3081, "epoch": 6.506469500924214, "learning_rate": 7.433043615054863e-06 } }, { "step": 17650, "logs": { "loss": 0.3002, "epoch": 6.524953789279113, "learning_rate": 7.393715341959336e-06 } }, { "step": 17700, "logs": { "loss": 0.3044, "epoch": 6.543438077634011, "learning_rate": 7.354387068863806e-06 } }, { "step": 17750, "logs": { "loss": 0.3016, "epoch": 6.561922365988909, "learning_rate": 7.3150587957682786e-06 } }, { "step": 17800, "logs": { "loss": 0.3071, "epoch": 6.580406654343808, "learning_rate": 7.27573052267275e-06 } }, { "step": 17850, "logs": { "loss": 0.3002, "epoch": 6.598890942698706, "learning_rate": 7.2364022495772215e-06 } }, { "step": 17900, "logs": { "loss": 0.3042, "epoch": 6.617375231053605, "learning_rate": 7.197073976481693e-06 } }, { "step": 17950, "logs": { "loss": 0.3042, "epoch": 6.635859519408503, "learning_rate": 7.157745703386165e-06 } }, { "step": 18000, "logs": { "loss": 0.3063, "epoch": 6.654343807763401, "learning_rate": 7.118417430290636e-06 } }, { "step": 18050, "logs": { "loss": 0.3031, "epoch": 6.672828096118299, "learning_rate": 7.079089157195108e-06 } }, { "step": 18100, "logs": { "loss": 0.3081, "epoch": 6.691312384473198, "learning_rate": 7.0397608840995805e-06 } }, { "step": 18150, "logs": { "loss": 0.3041, "epoch": 6.709796672828096, "learning_rate": 7.000432611004051e-06 } }, { "step": 18200, "logs": { "loss": 0.3036, "epoch": 6.728280961182994, "learning_rate": 6.961104337908523e-06 } }, { "step": 18250, "logs": { "loss": 0.3044, "epoch": 6.7467652495378925, "learning_rate": 6.921776064812995e-06 } }, { "step": 18300, "logs": { "loss": 0.3057, "epoch": 6.7652495378927915, "learning_rate": 6.882447791717466e-06 } }, { "step": 18350, "logs": { "loss": 0.3081, "epoch": 6.78373382624769, "learning_rate": 6.843119518621938e-06 } }, { "step": 18400, "logs": { "loss": 0.3058, "epoch": 6.802218114602588, "learning_rate": 6.80379124552641e-06 } }, { "step": 18450, "logs": { "loss": 0.3072, "epoch": 6.820702402957486, "learning_rate": 6.764462972430881e-06 } }, { "step": 18500, "logs": { "loss": 0.3042, "epoch": 6.839186691312385, "learning_rate": 6.725134699335353e-06 } }, { "step": 18550, "logs": { "loss": 0.3091, "epoch": 6.857670979667283, "learning_rate": 6.6858064262398245e-06 } }, { "step": 18600, "logs": { "loss": 0.3036, "epoch": 6.876155268022181, "learning_rate": 6.646478153144296e-06 } }, { "step": 18650, "logs": { "loss": 0.3081, "epoch": 6.894639556377079, "learning_rate": 6.607149880048767e-06 } }, { "step": 18700, "logs": { "loss": 0.3018, "epoch": 6.913123844731977, "learning_rate": 6.56782160695324e-06 } }, { "step": 18750, "logs": { "loss": 0.3055, "epoch": 6.931608133086876, "learning_rate": 6.52849333385771e-06 } }, { "step": 18800, "logs": { "loss": 0.3046, "epoch": 6.9500924214417745, "learning_rate": 6.489165060762183e-06 } }, { "step": 18850, "logs": { "loss": 0.3083, "epoch": 6.968576709796673, "learning_rate": 6.449836787666655e-06 } }, { "step": 18900, "logs": { "loss": 0.3118, "epoch": 6.987060998151571, "learning_rate": 6.4105085145711256e-06 } }, { "step": 18950, "logs": { "loss": 0.2902, "epoch": 7.00554528650647, "learning_rate": 6.371180241475597e-06 } }, { "step": 19000, "logs": { "loss": 0.241, "epoch": 7.024029574861368, "learning_rate": 6.331851968380069e-06 } }, { "step": 19050, "logs": { "loss": 0.2432, "epoch": 7.042513863216266, "learning_rate": 6.29252369528454e-06 } }, { "step": 19100, "logs": { "loss": 0.2405, "epoch": 7.060998151571164, "learning_rate": 6.253195422189012e-06 } }, { "step": 19150, "logs": { "loss": 0.2447, "epoch": 7.079482439926063, "learning_rate": 6.2138671490934846e-06 } }, { "step": 19200, "logs": { "loss": 0.2458, "epoch": 7.097966728280961, "learning_rate": 6.174538875997955e-06 } }, { "step": 19250, "logs": { "loss": 0.2414, "epoch": 7.116451016635859, "learning_rate": 6.1352106029024275e-06 } }, { "step": 19300, "logs": { "loss": 0.2465, "epoch": 7.134935304990758, "learning_rate": 6.095882329806899e-06 } }, { "step": 19350, "logs": { "loss": 0.2474, "epoch": 7.153419593345657, "learning_rate": 6.05655405671137e-06 } }, { "step": 19400, "logs": { "loss": 0.2464, "epoch": 7.171903881700555, "learning_rate": 6.017225783615842e-06 } }, { "step": 19450, "logs": { "loss": 0.2443, "epoch": 7.190388170055453, "learning_rate": 5.977897510520314e-06 } }, { "step": 19500, "logs": { "loss": 0.2466, "epoch": 7.208872458410351, "learning_rate": 5.938569237424785e-06 } }, { "step": 19550, "logs": { "loss": 0.2497, "epoch": 7.22735674676525, "learning_rate": 5.899240964329257e-06 } }, { "step": 19600, "logs": { "loss": 0.2469, "epoch": 7.245841035120148, "learning_rate": 5.859912691233728e-06 } }, { "step": 19650, "logs": { "loss": 0.2468, "epoch": 7.264325323475046, "learning_rate": 5.8205844181382e-06 } }, { "step": 19700, "logs": { "loss": 0.2495, "epoch": 7.282809611829944, "learning_rate": 5.7812561450426715e-06 } }, { "step": 19750, "logs": { "loss": 0.2496, "epoch": 7.3012939001848425, "learning_rate": 5.741927871947143e-06 } }, { "step": 19800, "logs": { "loss": 0.2516, "epoch": 7.3197781885397415, "learning_rate": 5.702599598851614e-06 } }, { "step": 19850, "logs": { "loss": 0.2516, "epoch": 7.33826247689464, "learning_rate": 5.663271325756087e-06 } }, { "step": 19900, "logs": { "loss": 0.2493, "epoch": 7.356746765249538, "learning_rate": 5.623943052660557e-06 } }, { "step": 19950, "logs": { "loss": 0.2458, "epoch": 7.375231053604436, "learning_rate": 5.58461477956503e-06 } }, { "step": 20000, "logs": { "loss": 0.2494, "epoch": 7.393715341959335, "learning_rate": 5.545286506469502e-06 } }, { "step": 20050, "logs": { "loss": 0.2534, "epoch": 7.412199630314233, "learning_rate": 5.5059582333739726e-06 } }, { "step": 20100, "logs": { "loss": 0.2499, "epoch": 7.430683918669131, "learning_rate": 5.466629960278445e-06 } }, { "step": 20150, "logs": { "loss": 0.249, "epoch": 7.449168207024029, "learning_rate": 5.427301687182916e-06 } }, { "step": 20200, "logs": { "loss": 0.2498, "epoch": 7.467652495378928, "learning_rate": 5.387973414087388e-06 } }, { "step": 20250, "logs": { "loss": 0.2541, "epoch": 7.486136783733826, "learning_rate": 5.348645140991859e-06 } }, { "step": 20300, "logs": { "loss": 0.2579, "epoch": 7.5046210720887245, "learning_rate": 5.3093168678963316e-06 } }, { "step": 20350, "logs": { "loss": 0.2476, "epoch": 7.523105360443623, "learning_rate": 5.269988594800802e-06 } }, { "step": 20400, "logs": { "loss": 0.2538, "epoch": 7.541589648798522, "learning_rate": 5.2306603217052745e-06 } }, { "step": 20450, "logs": { "loss": 0.2537, "epoch": 7.56007393715342, "learning_rate": 5.191332048609746e-06 } }, { "step": 20500, "logs": { "loss": 0.2522, "epoch": 7.578558225508318, "learning_rate": 5.152003775514217e-06 } }, { "step": 20550, "logs": { "loss": 0.2491, "epoch": 7.597042513863216, "learning_rate": 5.112675502418689e-06 } }, { "step": 20600, "logs": { "loss": 0.2509, "epoch": 7.615526802218114, "learning_rate": 5.073347229323161e-06 } }, { "step": 20650, "logs": { "loss": 0.2496, "epoch": 7.634011090573013, "learning_rate": 5.034018956227632e-06 } }, { "step": 20700, "logs": { "loss": 0.2542, "epoch": 7.652495378927911, "learning_rate": 4.994690683132104e-06 } }, { "step": 20750, "logs": { "loss": 0.2517, "epoch": 7.6709796672828094, "learning_rate": 4.9553624100365756e-06 } }, { "step": 20800, "logs": { "loss": 0.2544, "epoch": 7.689463955637708, "learning_rate": 4.916034136941048e-06 } }, { "step": 20850, "logs": { "loss": 0.2489, "epoch": 7.707948243992607, "learning_rate": 4.876705863845519e-06 } }, { "step": 20900, "logs": { "loss": 0.2506, "epoch": 7.726432532347505, "learning_rate": 4.83737759074999e-06 } }, { "step": 20950, "logs": { "loss": 0.2535, "epoch": 7.744916820702403, "learning_rate": 4.798049317654462e-06 } }, { "step": 21000, "logs": { "loss": 0.2506, "epoch": 7.763401109057301, "learning_rate": 4.758721044558934e-06 } }, { "step": 21050, "logs": { "loss": 0.2547, "epoch": 7.7818853974122, "learning_rate": 4.719392771463405e-06 } }, { "step": 21100, "logs": { "loss": 0.2525, "epoch": 7.800369685767098, "learning_rate": 4.6800644983678775e-06 } }, { "step": 21150, "logs": { "loss": 0.2535, "epoch": 7.818853974121996, "learning_rate": 4.640736225272349e-06 } }, { "step": 21200, "logs": { "loss": 0.2508, "epoch": 7.837338262476894, "learning_rate": 4.60140795217682e-06 } }, { "step": 21250, "logs": { "loss": 0.254, "epoch": 7.855822550831793, "learning_rate": 4.562079679081292e-06 } }, { "step": 21300, "logs": { "loss": 0.251, "epoch": 7.8743068391866915, "learning_rate": 4.522751405985763e-06 } }, { "step": 21350, "logs": { "loss": 0.2545, "epoch": 7.89279112754159, "learning_rate": 4.483423132890235e-06 } }, { "step": 21400, "logs": { "loss": 0.2497, "epoch": 7.911275415896488, "learning_rate": 4.444094859794707e-06 } }, { "step": 21450, "logs": { "loss": 0.253, "epoch": 7.929759704251387, "learning_rate": 4.4047665866991786e-06 } }, { "step": 21500, "logs": { "loss": 0.249, "epoch": 7.948243992606285, "learning_rate": 4.36543831360365e-06 } }, { "step": 21550, "logs": { "loss": 0.2534, "epoch": 7.966728280961183, "learning_rate": 4.3261100405081215e-06 } }, { "step": 21600, "logs": { "loss": 0.2563, "epoch": 7.985212569316081, "learning_rate": 4.286781767412593e-06 } }, { "step": 21650, "logs": { "loss": 0.2489, "epoch": 8.00369685767098, "learning_rate": 4.247453494317064e-06 } }, { "step": 21700, "logs": { "loss": 0.2079, "epoch": 8.022181146025877, "learning_rate": 4.208125221221537e-06 } }, { "step": 21750, "logs": { "loss": 0.2079, "epoch": 8.040665434380776, "learning_rate": 4.168796948126008e-06 } }, { "step": 21800, "logs": { "loss": 0.2055, "epoch": 8.059149722735675, "learning_rate": 4.12946867503048e-06 } }, { "step": 21850, "logs": { "loss": 0.2115, "epoch": 8.077634011090574, "learning_rate": 4.090140401934951e-06 } }, { "step": 21900, "logs": { "loss": 0.2105, "epoch": 8.096118299445472, "learning_rate": 4.050812128839423e-06 } }, { "step": 21950, "logs": { "loss": 0.2055, "epoch": 8.11460258780037, "learning_rate": 4.011483855743895e-06 } }, { "step": 22000, "logs": { "loss": 0.2086, "epoch": 8.133086876155268, "learning_rate": 3.972155582648366e-06 } }, { "step": 22050, "logs": { "loss": 0.2102, "epoch": 8.151571164510166, "learning_rate": 3.932827309552838e-06 } }, { "step": 22100, "logs": { "loss": 0.21, "epoch": 8.170055452865064, "learning_rate": 3.893499036457309e-06 } }, { "step": 22150, "logs": { "loss": 0.2081, "epoch": 8.188539741219962, "learning_rate": 3.854170763361781e-06 } }, { "step": 22200, "logs": { "loss": 0.213, "epoch": 8.207024029574862, "learning_rate": 3.814842490266253e-06 } }, { "step": 22250, "logs": { "loss": 0.2114, "epoch": 8.22550831792976, "learning_rate": 3.7755142171707245e-06 } }, { "step": 22300, "logs": { "loss": 0.2116, "epoch": 8.243992606284658, "learning_rate": 3.736185944075196e-06 } }, { "step": 22350, "logs": { "loss": 0.2106, "epoch": 8.262476894639557, "learning_rate": 3.696857670979668e-06 } }, { "step": 22400, "logs": { "loss": 0.2097, "epoch": 8.280961182994455, "learning_rate": 3.6575293978841393e-06 } }, { "step": 22450, "logs": { "loss": 0.2119, "epoch": 8.299445471349353, "learning_rate": 3.6182011247886107e-06 } }, { "step": 22500, "logs": { "loss": 0.2144, "epoch": 8.317929759704251, "learning_rate": 3.5788728516930826e-06 } }, { "step": 22550, "logs": { "loss": 0.2125, "epoch": 8.336414048059149, "learning_rate": 3.539544578597554e-06 } }, { "step": 22600, "logs": { "loss": 0.2134, "epoch": 8.354898336414047, "learning_rate": 3.5002163055020256e-06 } }, { "step": 22650, "logs": { "loss": 0.2127, "epoch": 8.373382624768947, "learning_rate": 3.4608880324064974e-06 } }, { "step": 22700, "logs": { "loss": 0.2111, "epoch": 8.391866913123845, "learning_rate": 3.421559759310969e-06 } }, { "step": 22750, "logs": { "loss": 0.213, "epoch": 8.410351201478743, "learning_rate": 3.3822314862154404e-06 } }, { "step": 22800, "logs": { "loss": 0.2109, "epoch": 8.428835489833642, "learning_rate": 3.3429032131199122e-06 } }, { "step": 22850, "logs": { "loss": 0.2093, "epoch": 8.44731977818854, "learning_rate": 3.3035749400243837e-06 } }, { "step": 22900, "logs": { "loss": 0.2126, "epoch": 8.465804066543438, "learning_rate": 3.264246666928855e-06 } }, { "step": 22950, "logs": { "loss": 0.2127, "epoch": 8.484288354898336, "learning_rate": 3.2249183938333275e-06 } }, { "step": 23000, "logs": { "loss": 0.2184, "epoch": 8.502772643253234, "learning_rate": 3.1855901207377985e-06 } }, { "step": 23050, "logs": { "loss": 0.2108, "epoch": 8.521256931608134, "learning_rate": 3.14626184764227e-06 } }, { "step": 23100, "logs": { "loss": 0.2123, "epoch": 8.539741219963032, "learning_rate": 3.1069335745467423e-06 } }, { "step": 23150, "logs": { "loss": 0.2125, "epoch": 8.55822550831793, "learning_rate": 3.0676053014512137e-06 } }, { "step": 23200, "logs": { "loss": 0.2124, "epoch": 8.576709796672828, "learning_rate": 3.028277028355685e-06 } }, { "step": 23250, "logs": { "loss": 0.2112, "epoch": 8.595194085027726, "learning_rate": 2.988948755260157e-06 } }, { "step": 23300, "logs": { "loss": 0.2103, "epoch": 8.613678373382625, "learning_rate": 2.9496204821646285e-06 } }, { "step": 23350, "logs": { "loss": 0.2128, "epoch": 8.632162661737523, "learning_rate": 2.9102922090691e-06 } }, { "step": 23400, "logs": { "loss": 0.2125, "epoch": 8.65064695009242, "learning_rate": 2.8709639359735715e-06 } }, { "step": 23450, "logs": { "loss": 0.2109, "epoch": 8.669131238447319, "learning_rate": 2.8316356628780434e-06 } }, { "step": 23500, "logs": { "loss": 0.2132, "epoch": 8.687615526802219, "learning_rate": 2.792307389782515e-06 } }, { "step": 23550, "logs": { "loss": 0.2113, "epoch": 8.706099815157117, "learning_rate": 2.7529791166869863e-06 } }, { "step": 23600, "logs": { "loss": 0.2109, "epoch": 8.724584103512015, "learning_rate": 2.713650843591458e-06 } }, { "step": 23650, "logs": { "loss": 0.2138, "epoch": 8.743068391866913, "learning_rate": 2.6743225704959296e-06 } }, { "step": 23700, "logs": { "loss": 0.2098, "epoch": 8.761552680221811, "learning_rate": 2.634994297400401e-06 } }, { "step": 23750, "logs": { "loss": 0.2128, "epoch": 8.78003696857671, "learning_rate": 2.595666024304873e-06 } }, { "step": 23800, "logs": { "loss": 0.2143, "epoch": 8.798521256931608, "learning_rate": 2.5563377512093444e-06 } }, { "step": 23850, "logs": { "loss": 0.2132, "epoch": 8.817005545286506, "learning_rate": 2.517009478113816e-06 } }, { "step": 23900, "logs": { "loss": 0.2099, "epoch": 8.835489833641406, "learning_rate": 2.4776812050182878e-06 } }, { "step": 23950, "logs": { "loss": 0.2124, "epoch": 8.853974121996304, "learning_rate": 2.4383529319227597e-06 } }, { "step": 24000, "logs": { "loss": 0.2122, "epoch": 8.872458410351202, "learning_rate": 2.399024658827231e-06 } }, { "step": 24050, "logs": { "loss": 0.2136, "epoch": 8.8909426987061, "learning_rate": 2.3596963857317026e-06 } }, { "step": 24100, "logs": { "loss": 0.2103, "epoch": 8.909426987060998, "learning_rate": 2.3203681126361745e-06 } }, { "step": 24150, "logs": { "loss": 0.2132, "epoch": 8.927911275415896, "learning_rate": 2.281039839540646e-06 } }, { "step": 24200, "logs": { "loss": 0.2082, "epoch": 8.946395563770794, "learning_rate": 2.2417115664451174e-06 } }, { "step": 24250, "logs": { "loss": 0.213, "epoch": 8.964879852125692, "learning_rate": 2.2023832933495893e-06 } }, { "step": 24300, "logs": { "loss": 0.2142, "epoch": 8.98336414048059, "learning_rate": 2.1630550202540607e-06 } }, { "step": 24350, "logs": { "loss": 0.2123, "epoch": 9.00184842883549, "learning_rate": 2.123726747158532e-06 } }, { "step": 24400, "logs": { "loss": 0.1854, "epoch": 9.020332717190389, "learning_rate": 2.084398474063004e-06 } }, { "step": 24450, "logs": { "loss": 0.1848, "epoch": 9.038817005545287, "learning_rate": 2.0450702009674755e-06 } }, { "step": 24500, "logs": { "loss": 0.1802, "epoch": 9.057301293900185, "learning_rate": 2.0057419278719474e-06 } }, { "step": 24550, "logs": { "loss": 0.1859, "epoch": 9.075785582255083, "learning_rate": 1.966413654776419e-06 } }, { "step": 24600, "logs": { "loss": 0.1849, "epoch": 9.094269870609981, "learning_rate": 1.9270853816808904e-06 } }, { "step": 24650, "logs": { "loss": 0.1841, "epoch": 9.11275415896488, "learning_rate": 1.8877571085853622e-06 } }, { "step": 24700, "logs": { "loss": 0.1854, "epoch": 9.131238447319777, "learning_rate": 1.848428835489834e-06 } }, { "step": 24750, "logs": { "loss": 0.1847, "epoch": 9.149722735674677, "learning_rate": 1.8091005623943054e-06 } }, { "step": 24800, "logs": { "loss": 0.1852, "epoch": 9.168207024029575, "learning_rate": 1.769772289298777e-06 } }, { "step": 24850, "logs": { "loss": 0.1846, "epoch": 9.186691312384474, "learning_rate": 1.7304440162032487e-06 } }, { "step": 24900, "logs": { "loss": 0.1848, "epoch": 9.205175600739372, "learning_rate": 1.6911157431077202e-06 } }, { "step": 24950, "logs": { "loss": 0.1861, "epoch": 9.22365988909427, "learning_rate": 1.6517874700121919e-06 } }, { "step": 25000, "logs": { "loss": 0.185, "epoch": 9.242144177449168, "learning_rate": 1.6124591969166637e-06 } }, { "step": 25050, "logs": { "loss": 0.1846, "epoch": 9.260628465804066, "learning_rate": 1.573130923821135e-06 } }, { "step": 25100, "logs": { "loss": 0.1827, "epoch": 9.279112754158964, "learning_rate": 1.5338026507256069e-06 } }, { "step": 25150, "logs": { "loss": 0.1871, "epoch": 9.297597042513864, "learning_rate": 1.4944743776300785e-06 } }, { "step": 25200, "logs": { "loss": 0.1865, "epoch": 9.316081330868762, "learning_rate": 1.45514610453455e-06 } }, { "step": 25250, "logs": { "loss": 0.1859, "epoch": 9.33456561922366, "learning_rate": 1.4158178314390217e-06 } }, { "step": 25300, "logs": { "loss": 0.1874, "epoch": 9.353049907578558, "learning_rate": 1.3764895583434931e-06 } }, { "step": 25350, "logs": { "loss": 0.1847, "epoch": 9.371534195933457, "learning_rate": 1.3371612852479648e-06 } }, { "step": 25400, "logs": { "loss": 0.1849, "epoch": 9.390018484288355, "learning_rate": 1.2978330121524365e-06 } }, { "step": 25450, "logs": { "loss": 0.1895, "epoch": 9.408502772643253, "learning_rate": 1.258504739056908e-06 } }, { "step": 25500, "logs": { "loss": 0.1829, "epoch": 9.426987060998151, "learning_rate": 1.2191764659613798e-06 } }, { "step": 25550, "logs": { "loss": 0.1837, "epoch": 9.445471349353049, "learning_rate": 1.1798481928658513e-06 } }, { "step": 25600, "logs": { "loss": 0.1864, "epoch": 9.463955637707949, "learning_rate": 1.140519919770323e-06 } }, { "step": 25650, "logs": { "loss": 0.1862, "epoch": 9.482439926062847, "learning_rate": 1.1011916466747946e-06 } }, { "step": 25700, "logs": { "loss": 0.19, "epoch": 9.500924214417745, "learning_rate": 1.061863373579266e-06 } }, { "step": 25750, "logs": { "loss": 0.1834, "epoch": 9.519408502772643, "learning_rate": 1.0225351004837378e-06 } }, { "step": 25800, "logs": { "loss": 0.1863, "epoch": 9.537892791127542, "learning_rate": 9.832068273882094e-07 } }, { "step": 25850, "logs": { "loss": 0.1859, "epoch": 9.55637707948244, "learning_rate": 9.438785542926811e-07 } }, { "step": 25900, "logs": { "loss": 0.1829, "epoch": 9.574861367837338, "learning_rate": 9.045502811971527e-07 } }, { "step": 25950, "logs": { "loss": 0.1838, "epoch": 9.593345656192236, "learning_rate": 8.652220081016244e-07 } }, { "step": 26000, "logs": { "loss": 0.1817, "epoch": 9.611829944547136, "learning_rate": 8.258937350060959e-07 } }, { "step": 26050, "logs": { "loss": 0.1834, "epoch": 9.630314232902034, "learning_rate": 7.865654619105675e-07 } }, { "step": 26100, "logs": { "loss": 0.1857, "epoch": 9.648798521256932, "learning_rate": 7.472371888150393e-07 } }, { "step": 26150, "logs": { "loss": 0.1858, "epoch": 9.66728280961183, "learning_rate": 7.079089157195108e-07 } }, { "step": 26200, "logs": { "loss": 0.1858, "epoch": 9.685767097966728, "learning_rate": 6.685806426239824e-07 } }, { "step": 26250, "logs": { "loss": 0.1848, "epoch": 9.704251386321626, "learning_rate": 6.29252369528454e-07 } }, { "step": 26300, "logs": { "loss": 0.1832, "epoch": 9.722735674676525, "learning_rate": 5.899240964329256e-07 } }, { "step": 26350, "logs": { "loss": 0.1842, "epoch": 9.741219963031423, "learning_rate": 5.505958233373973e-07 } }, { "step": 26400, "logs": { "loss": 0.1842, "epoch": 9.75970425138632, "learning_rate": 5.112675502418689e-07 } }, { "step": 26450, "logs": { "loss": 0.1847, "epoch": 9.77818853974122, "learning_rate": 4.7193927714634056e-07 } }, { "step": 26500, "logs": { "loss": 0.185, "epoch": 9.796672828096119, "learning_rate": 4.326110040508122e-07 } }, { "step": 26550, "logs": { "loss": 0.1826, "epoch": 9.815157116451017, "learning_rate": 3.9328273095528375e-07 } }, { "step": 26600, "logs": { "loss": 0.1833, "epoch": 9.833641404805915, "learning_rate": 3.539544578597554e-07 } }, { "step": 26650, "logs": { "loss": 0.1846, "epoch": 9.852125693160813, "learning_rate": 3.14626184764227e-07 } }, { "step": 26700, "logs": { "loss": 0.184, "epoch": 9.870609981515711, "learning_rate": 2.7529791166869866e-07 } }, { "step": 26750, "logs": { "loss": 0.1864, "epoch": 9.88909426987061, "learning_rate": 2.3596963857317028e-07 } }, { "step": 26800, "logs": { "loss": 0.1841, "epoch": 9.907578558225508, "learning_rate": 1.9664136547764187e-07 } }, { "step": 26850, "logs": { "loss": 0.1855, "epoch": 9.926062846580407, "learning_rate": 1.573130923821135e-07 } }, { "step": 26900, "logs": { "loss": 0.1794, "epoch": 9.944547134935306, "learning_rate": 1.1798481928658514e-07 } }, { "step": 26950, "logs": { "loss": 0.1853, "epoch": 9.963031423290204, "learning_rate": 7.865654619105675e-08 } }, { "step": 27000, "logs": { "loss": 0.1855, "epoch": 9.981515711645102, "learning_rate": 3.9328273095528373e-08 } } ], "train_wrt_samples": [ { "step": 19200, "logs": { "loss": 1.2091, "epoch": 0.018484288354898338, "learning_rate": 1.0584432680980562e-05 } }, { "step": 38400, "logs": { "loss": 1.1315, "epoch": 0.036968576709796676, "learning_rate": 1.2459822860720352e-05 } }, { "step": 57600, "logs": { "loss": 1.1118, "epoch": 0.05545286506469501, "learning_rate": 1.355685579689696e-05 } }, { "step": 76800, "logs": { "loss": 1.1091, "epoch": 0.07393715341959335, "learning_rate": 1.4335213053988223e-05 } }, { "step": 96000, "logs": { "loss": 1.1063, "epoch": 0.09242144177449169, "learning_rate": 1.4938953847726847e-05 } }, { "step": 115200, "logs": { "loss": 1.1012, "epoch": 0.11090573012939002, "learning_rate": 1.5432245994674192e-05 } }, { "step": 134400, "logs": { "loss": 1.0844, "epoch": 0.12939001848428835, "learning_rate": 1.5849318562425815e-05 } }, { "step": 153600, "logs": { "loss": 1.0911, "epoch": 0.1478743068391867, "learning_rate": 1.6210603254020138e-05 } }, { "step": 172800, "logs": { "loss": 1.0816, "epoch": 0.16635859519408502, "learning_rate": 1.652927893686328e-05 } }, { "step": 192000, "logs": { "loss": 1.0819, "epoch": 0.18484288354898337, "learning_rate": 1.6814344049111566e-05 } }, { "step": 211200, "logs": { "loss": 1.0757, "epoch": 0.2033271719038817, "learning_rate": 1.70722168104602e-05 } }, { "step": 230400, "logs": { "loss": 1.0706, "epoch": 0.22181146025878004, "learning_rate": 1.7307636196960783e-05 } }, { "step": 249600, "logs": { "loss": 1.0698, "epoch": 0.24029574861367836, "learning_rate": 1.7524201039271304e-05 } }, { "step": 268800, "logs": { "loss": 1.0632, "epoch": 0.2587800369685767, "learning_rate": 1.7724708765356604e-05 } }, { "step": 288000, "logs": { "loss": 1.0601, "epoch": 0.27726432532347506, "learning_rate": 1.7911376992503148e-05 } }, { "step": 307200, "logs": { "loss": 1.0582, "epoch": 0.2957486136783734, "learning_rate": 1.808599345743407e-05 } }, { "step": 326400, "logs": { "loss": 1.0512, "epoch": 0.3142329020332717, "learning_rate": 1.825002041317456e-05 } }, { "step": 345600, "logs": { "loss": 1.0544, "epoch": 0.33271719038817005, "learning_rate": 1.840466914065299e-05 } }, { "step": 364800, "logs": { "loss": 1.043, "epoch": 0.3512014787430684, "learning_rate": 1.855095428760744e-05 } }, { "step": 384000, "logs": { "loss": 1.047, "epoch": 0.36968576709796674, "learning_rate": 1.8689734253201903e-05 } }, { "step": 403200, "logs": { "loss": 1.0408, "epoch": 0.38817005545286504, "learning_rate": 1.8821741709263542e-05 } }, { "step": 422400, "logs": { "loss": 1.0431, "epoch": 0.4066543438077634, "learning_rate": 1.89476070147965e-05 } }, { "step": 441600, "logs": { "loss": 1.0431, "epoch": 0.42513863216266173, "learning_rate": 1.9067876421445012e-05 } }, { "step": 460800, "logs": { "loss": 1.034, "epoch": 0.4436229205175601, "learning_rate": 1.9183026401502057e-05 } }, { "step": 480000, "logs": { "loss": 1.039, "epoch": 0.46210720887245843, "learning_rate": 1.9293475049105016e-05 } }, { "step": 499200, "logs": { "loss": 1.0304, "epoch": 0.4805914972273567, "learning_rate": 1.9399591243986016e-05 } }, { "step": 518400, "logs": { "loss": 1.0385, "epoch": 0.49907578558225507, "learning_rate": 1.950170208484624e-05 } }, { "step": 537600, "logs": { "loss": 1.027, "epoch": 0.5175600739371534, "learning_rate": 1.9600098970219974e-05 } }, { "step": 556800, "logs": { "loss": 1.0281, "epoch": 0.5360443622920518, "learning_rate": 1.9695042611797287e-05 } }, { "step": 576000, "logs": { "loss": 1.0282, "epoch": 0.5545286506469501, "learning_rate": 1.978676719749536e-05 } }, { "step": 595200, "logs": { "loss": 1.0186, "epoch": 0.5730129390018485, "learning_rate": 1.9875483871657987e-05 } }, { "step": 614400, "logs": { "loss": 1.0237, "epoch": 0.5914972273567468, "learning_rate": 1.9961383662539012e-05 } }, { "step": 633600, "logs": { "loss": 1.0176, "epoch": 0.609981515711645, "learning_rate": 1.9978762732528416e-05 } }, { "step": 652800, "logs": { "loss": 1.4539, "epoch": 0.6284658040665434, "learning_rate": 1.9939434459432887e-05 } }, { "step": 672000, "logs": { "loss": 1.2593, "epoch": 0.6469500924214417, "learning_rate": 1.990010618633736e-05 } }, { "step": 691200, "logs": { "loss": 1.5937, "epoch": 0.6654343807763401, "learning_rate": 1.986077791324183e-05 } }, { "step": 710400, "logs": { "loss": 1.0165, "epoch": 0.6839186691312384, "learning_rate": 1.9821449640146302e-05 } }, { "step": 729600, "logs": { "loss": 1.4354, "epoch": 0.7024029574861368, "learning_rate": 1.9782121367050776e-05 } }, { "step": 748800, "logs": { "loss": 1.021, "epoch": 0.7208872458410351, "learning_rate": 1.9742793093955247e-05 } }, { "step": 768000, "logs": { "loss": 1.0078, "epoch": 0.7393715341959335, "learning_rate": 1.9703464820859717e-05 } }, { "step": 787200, "logs": { "loss": 1.0057, "epoch": 0.7578558225508318, "learning_rate": 1.966413654776419e-05 } }, { "step": 806400, "logs": { "loss": 1.0001, "epoch": 0.7763401109057301, "learning_rate": 1.9624808274668662e-05 } }, { "step": 825600, "logs": { "loss": 1.006, "epoch": 0.7948243992606284, "learning_rate": 1.9585480001573133e-05 } }, { "step": 844800, "logs": { "loss": 1.0103, "epoch": 0.8133086876155268, "learning_rate": 1.9546151728477603e-05 } }, { "step": 864000, "logs": { "loss": 1.0046, "epoch": 0.8317929759704251, "learning_rate": 1.9506823455382077e-05 } }, { "step": 883200, "logs": { "loss": 0.9941, "epoch": 0.8502772643253235, "learning_rate": 1.9467495182286548e-05 } }, { "step": 902400, "logs": { "loss": 0.9963, "epoch": 0.8687615526802218, "learning_rate": 1.942816690919102e-05 } }, { "step": 921600, "logs": { "loss": 0.9926, "epoch": 0.8872458410351202, "learning_rate": 1.938883863609549e-05 } }, { "step": 940800, "logs": { "loss": 0.9918, "epoch": 0.9057301293900185, "learning_rate": 1.934951036299996e-05 } }, { "step": 960000, "logs": { "loss": 0.9899, "epoch": 0.9242144177449169, "learning_rate": 1.9310182089904434e-05 } }, { "step": 979200, "logs": { "loss": 0.9887, "epoch": 0.9426987060998152, "learning_rate": 1.9270853816808904e-05 } }, { "step": 998400, "logs": { "loss": 0.9942, "epoch": 0.9611829944547134, "learning_rate": 1.9231525543713375e-05 } }, { "step": 1017600, "logs": { "loss": 0.9817, "epoch": 0.9796672828096118, "learning_rate": 1.919219727061785e-05 } }, { "step": 1036800, "logs": { "loss": 0.9811, "epoch": 0.9981515711645101, "learning_rate": 1.915286899752232e-05 } }, { "step": 1055744, "logs": { "loss": 0.8466, "epoch": 1.0166358595194085, "learning_rate": 1.911354072442679e-05 } }, { "step": 1074944, "logs": { "loss": 0.8316, "epoch": 1.0351201478743068, "learning_rate": 1.9074212451331264e-05 } }, { "step": 1094144, "logs": { "loss": 0.8363, "epoch": 1.0536044362292052, "learning_rate": 1.9034884178235735e-05 } }, { "step": 1113344, "logs": { "loss": 0.8378, "epoch": 1.0720887245841035, "learning_rate": 1.8995555905140205e-05 } }, { "step": 1132544, "logs": { "loss": 0.8386, "epoch": 1.0905730129390019, "learning_rate": 1.895622763204468e-05 } }, { "step": 1151744, "logs": { "loss": 0.8465, "epoch": 1.1090573012939002, "learning_rate": 1.891689935894915e-05 } }, { "step": 1170944, "logs": { "loss": 0.8375, "epoch": 1.1275415896487986, "learning_rate": 1.887757108585362e-05 } }, { "step": 1190144, "logs": { "loss": 0.8379, "epoch": 1.146025878003697, "learning_rate": 1.8838242812758095e-05 } }, { "step": 1209344, "logs": { "loss": 0.836, "epoch": 1.1645101663585953, "learning_rate": 1.8798914539662565e-05 } }, { "step": 1228544, "logs": { "loss": 0.8411, "epoch": 1.1829944547134936, "learning_rate": 1.8759586266567036e-05 } }, { "step": 1247744, "logs": { "loss": 0.8442, "epoch": 1.201478743068392, "learning_rate": 1.872025799347151e-05 } }, { "step": 1266944, "logs": { "loss": 0.8397, "epoch": 1.21996303142329, "learning_rate": 1.868092972037598e-05 } }, { "step": 1286144, "logs": { "loss": 0.8415, "epoch": 1.2384473197781884, "learning_rate": 1.864160144728045e-05 } }, { "step": 1305344, "logs": { "loss": 0.8397, "epoch": 1.2569316081330868, "learning_rate": 1.8602273174184925e-05 } }, { "step": 1324544, "logs": { "loss": 0.8396, "epoch": 1.2754158964879851, "learning_rate": 1.8562944901089396e-05 } }, { "step": 1343744, "logs": { "loss": 0.8452, "epoch": 1.2939001848428835, "learning_rate": 1.8523616627993866e-05 } }, { "step": 1362944, "logs": { "loss": 0.8362, "epoch": 1.3123844731977818, "learning_rate": 1.848428835489834e-05 } }, { "step": 1382144, "logs": { "loss": 0.8396, "epoch": 1.3308687615526802, "learning_rate": 1.844496008180281e-05 } }, { "step": 1401344, "logs": { "loss": 0.8334, "epoch": 1.3493530499075785, "learning_rate": 1.840563180870728e-05 } }, { "step": 1420544, "logs": { "loss": 0.834, "epoch": 1.3678373382624769, "learning_rate": 1.8366303535611752e-05 } }, { "step": 1439744, "logs": { "loss": 0.8333, "epoch": 1.3863216266173752, "learning_rate": 1.8326975262516223e-05 } }, { "step": 1458944, "logs": { "loss": 0.8357, "epoch": 1.4048059149722736, "learning_rate": 1.8287646989420697e-05 } }, { "step": 1478144, "logs": { "loss": 0.8374, "epoch": 1.423290203327172, "learning_rate": 1.8248318716325167e-05 } }, { "step": 1497344, "logs": { "loss": 0.837, "epoch": 1.4417744916820703, "learning_rate": 1.8208990443229638e-05 } }, { "step": 1516544, "logs": { "loss": 0.835, "epoch": 1.4602587800369686, "learning_rate": 1.816966217013411e-05 } }, { "step": 1535744, "logs": { "loss": 0.8352, "epoch": 1.478743068391867, "learning_rate": 1.8130333897038583e-05 } }, { "step": 1554944, "logs": { "loss": 0.8475, "epoch": 1.4972273567467653, "learning_rate": 1.8091005623943053e-05 } }, { "step": 1574144, "logs": { "loss": 0.8339, "epoch": 1.5157116451016637, "learning_rate": 1.8051677350847524e-05 } }, { "step": 1593344, "logs": { "loss": 0.8382, "epoch": 1.534195933456562, "learning_rate": 1.8012349077751998e-05 } }, { "step": 1612544, "logs": { "loss": 0.8376, "epoch": 1.5526802218114601, "learning_rate": 1.797302080465647e-05 } }, { "step": 1631744, "logs": { "loss": 0.8302, "epoch": 1.5711645101663585, "learning_rate": 1.793369253156094e-05 } }, { "step": 1650944, "logs": { "loss": 0.8312, "epoch": 1.5896487985212568, "learning_rate": 1.7894364258465413e-05 } }, { "step": 1670144, "logs": { "loss": 0.8361, "epoch": 1.6081330868761552, "learning_rate": 1.7855035985369884e-05 } }, { "step": 1689344, "logs": { "loss": 0.8321, "epoch": 1.6266173752310535, "learning_rate": 1.7815707712274354e-05 } }, { "step": 1708544, "logs": { "loss": 0.8374, "epoch": 1.645101663585952, "learning_rate": 1.777637943917883e-05 } }, { "step": 1727744, "logs": { "loss": 0.8287, "epoch": 1.6635859519408502, "learning_rate": 1.77370511660833e-05 } }, { "step": 1746944, "logs": { "loss": 0.8367, "epoch": 1.6820702402957486, "learning_rate": 1.769772289298777e-05 } }, { "step": 1766144, "logs": { "loss": 0.8439, "epoch": 1.700554528650647, "learning_rate": 1.7658394619892244e-05 } }, { "step": 1785344, "logs": { "loss": 0.829, "epoch": 1.7190388170055453, "learning_rate": 1.7619066346796714e-05 } }, { "step": 1804544, "logs": { "loss": 0.8325, "epoch": 1.7375231053604436, "learning_rate": 1.7579738073701185e-05 } }, { "step": 1823744, "logs": { "loss": 0.837, "epoch": 1.756007393715342, "learning_rate": 1.754040980060566e-05 } }, { "step": 1842944, "logs": { "loss": 0.8371, "epoch": 1.7744916820702403, "learning_rate": 1.750108152751013e-05 } }, { "step": 1862144, "logs": { "loss": 0.832, "epoch": 1.7929759704251387, "learning_rate": 1.74617532544146e-05 } }, { "step": 1881344, "logs": { "loss": 0.8342, "epoch": 1.811460258780037, "learning_rate": 1.7422424981319074e-05 } }, { "step": 1900544, "logs": { "loss": 0.8331, "epoch": 1.8299445471349354, "learning_rate": 1.7383096708223545e-05 } }, { "step": 1919744, "logs": { "loss": 0.8234, "epoch": 1.8484288354898337, "learning_rate": 1.7343768435128015e-05 } }, { "step": 1938944, "logs": { "loss": 0.8311, "epoch": 1.866913123844732, "learning_rate": 1.7304440162032486e-05 } }, { "step": 1958144, "logs": { "loss": 0.8259, "epoch": 1.8853974121996304, "learning_rate": 1.726511188893696e-05 } }, { "step": 1977344, "logs": { "loss": 0.8253, "epoch": 1.9038817005545285, "learning_rate": 1.722578361584143e-05 } }, { "step": 1996544, "logs": { "loss": 0.8297, "epoch": 1.922365988909427, "learning_rate": 1.71864553427459e-05 } }, { "step": 2015744, "logs": { "loss": 0.8264, "epoch": 1.9408502772643252, "learning_rate": 1.7147127069650372e-05 } }, { "step": 2034944, "logs": { "loss": 0.8283, "epoch": 1.9593345656192236, "learning_rate": 1.7107798796554846e-05 } }, { "step": 2054144, "logs": { "loss": 0.8262, "epoch": 1.977818853974122, "learning_rate": 1.7068470523459316e-05 } }, { "step": 2073344, "logs": { "loss": 0.829, "epoch": 1.9963031423290203, "learning_rate": 1.7029142250363787e-05 } }, { "step": 2092288, "logs": { "loss": 0.6969, "epoch": 2.014787430683919, "learning_rate": 1.6989813977268258e-05 } }, { "step": 2111488, "logs": { "loss": 0.6715, "epoch": 2.033271719038817, "learning_rate": 1.695048570417273e-05 } }, { "step": 2130688, "logs": { "loss": 0.6636, "epoch": 2.0517560073937156, "learning_rate": 1.6911157431077202e-05 } }, { "step": 2149888, "logs": { "loss": 0.6649, "epoch": 2.0702402957486137, "learning_rate": 1.6871829157981673e-05 } }, { "step": 2169088, "logs": { "loss": 0.665, "epoch": 2.088724584103512, "learning_rate": 1.6832500884886147e-05 } }, { "step": 2188288, "logs": { "loss": 0.6746, "epoch": 2.1072088724584104, "learning_rate": 1.6793172611790617e-05 } }, { "step": 2207488, "logs": { "loss": 0.6678, "epoch": 2.1256931608133085, "learning_rate": 1.6753844338695088e-05 } }, { "step": 2226688, "logs": { "loss": 0.6739, "epoch": 2.144177449168207, "learning_rate": 1.6714516065599562e-05 } }, { "step": 2245888, "logs": { "loss": 0.6666, "epoch": 2.162661737523105, "learning_rate": 1.6675187792504033e-05 } }, { "step": 2265088, "logs": { "loss": 0.674, "epoch": 2.1811460258780038, "learning_rate": 1.6635859519408503e-05 } }, { "step": 2284288, "logs": { "loss": 0.6737, "epoch": 2.199630314232902, "learning_rate": 1.6596531246312977e-05 } }, { "step": 2303488, "logs": { "loss": 0.675, "epoch": 2.2181146025878005, "learning_rate": 1.6557202973217448e-05 } }, { "step": 2322688, "logs": { "loss": 0.6743, "epoch": 2.2365988909426986, "learning_rate": 1.651787470012192e-05 } }, { "step": 2341888, "logs": { "loss": 0.6718, "epoch": 2.255083179297597, "learning_rate": 1.647854642702639e-05 } }, { "step": 2361088, "logs": { "loss": 0.6735, "epoch": 2.2735674676524953, "learning_rate": 1.6439218153930863e-05 } }, { "step": 2380288, "logs": { "loss": 0.6798, "epoch": 2.292051756007394, "learning_rate": 1.6399889880835334e-05 } }, { "step": 2399488, "logs": { "loss": 0.6768, "epoch": 2.310536044362292, "learning_rate": 1.6360561607739804e-05 } }, { "step": 2418688, "logs": { "loss": 0.6796, "epoch": 2.3290203327171906, "learning_rate": 1.632123333464428e-05 } }, { "step": 2437888, "logs": { "loss": 0.6813, "epoch": 2.3475046210720887, "learning_rate": 1.628190506154875e-05 } }, { "step": 2457088, "logs": { "loss": 0.6774, "epoch": 2.3659889094269873, "learning_rate": 1.624257678845322e-05 } }, { "step": 2476288, "logs": { "loss": 0.6745, "epoch": 2.3844731977818854, "learning_rate": 1.6203248515357694e-05 } }, { "step": 2495488, "logs": { "loss": 0.6809, "epoch": 2.402957486136784, "learning_rate": 1.6163920242262164e-05 } }, { "step": 2514688, "logs": { "loss": 0.6831, "epoch": 2.421441774491682, "learning_rate": 1.6124591969166635e-05 } }, { "step": 2533888, "logs": { "loss": 0.6803, "epoch": 2.43992606284658, "learning_rate": 1.608526369607111e-05 } }, { "step": 2553088, "logs": { "loss": 0.6791, "epoch": 2.4584103512014788, "learning_rate": 1.604593542297558e-05 } }, { "step": 2572288, "logs": { "loss": 0.6812, "epoch": 2.476894639556377, "learning_rate": 1.600660714988005e-05 } }, { "step": 2591488, "logs": { "loss": 0.6866, "epoch": 2.4953789279112755, "learning_rate": 1.596727887678452e-05 } }, { "step": 2610688, "logs": { "loss": 0.6837, "epoch": 2.5138632162661736, "learning_rate": 1.5927950603688995e-05 } }, { "step": 2629888, "logs": { "loss": 0.6814, "epoch": 2.532347504621072, "learning_rate": 1.5888622330593465e-05 } }, { "step": 2649088, "logs": { "loss": 0.6845, "epoch": 2.5508317929759703, "learning_rate": 1.5849294057497936e-05 } }, { "step": 2668288, "logs": { "loss": 0.6832, "epoch": 2.569316081330869, "learning_rate": 1.5809965784402407e-05 } }, { "step": 2687488, "logs": { "loss": 0.6795, "epoch": 2.587800369685767, "learning_rate": 1.5770637511306877e-05 } }, { "step": 2706688, "logs": { "loss": 0.679, "epoch": 2.6062846580406656, "learning_rate": 1.573130923821135e-05 } }, { "step": 2725888, "logs": { "loss": 0.6851, "epoch": 2.6247689463955637, "learning_rate": 1.5691980965115822e-05 } }, { "step": 2745088, "logs": { "loss": 0.692, "epoch": 2.6432532347504623, "learning_rate": 1.5652652692020292e-05 } }, { "step": 2764288, "logs": { "loss": 0.6956, "epoch": 2.6617375231053604, "learning_rate": 1.5613324418924766e-05 } }, { "step": 2783488, "logs": { "loss": 0.6883, "epoch": 2.680221811460259, "learning_rate": 1.5573996145829237e-05 } }, { "step": 2802688, "logs": { "loss": 0.6806, "epoch": 2.698706099815157, "learning_rate": 1.5534667872733708e-05 } }, { "step": 2821888, "logs": { "loss": 0.6832, "epoch": 2.7171903881700556, "learning_rate": 1.549533959963818e-05 } }, { "step": 2841088, "logs": { "loss": 0.6871, "epoch": 2.7356746765249538, "learning_rate": 1.5456011326542652e-05 } }, { "step": 2860288, "logs": { "loss": 0.6843, "epoch": 2.7541589648798523, "learning_rate": 1.5416683053447123e-05 } }, { "step": 2879488, "logs": { "loss": 0.6869, "epoch": 2.7726432532347505, "learning_rate": 1.5377354780351597e-05 } }, { "step": 2898688, "logs": { "loss": 0.689, "epoch": 2.7911275415896486, "learning_rate": 1.5338026507256067e-05 } }, { "step": 2917888, "logs": { "loss": 0.6864, "epoch": 2.809611829944547, "learning_rate": 1.5298698234160538e-05 } }, { "step": 2937088, "logs": { "loss": 0.6875, "epoch": 2.8280961182994453, "learning_rate": 1.5259369961065012e-05 } }, { "step": 2956288, "logs": { "loss": 0.6844, "epoch": 2.846580406654344, "learning_rate": 1.5220041687969483e-05 } }, { "step": 2975488, "logs": { "loss": 0.6916, "epoch": 2.865064695009242, "learning_rate": 1.5180713414873953e-05 } }, { "step": 2994688, "logs": { "loss": 0.6849, "epoch": 2.8835489833641406, "learning_rate": 1.5141385141778426e-05 } }, { "step": 3013888, "logs": { "loss": 0.6835, "epoch": 2.9020332717190387, "learning_rate": 1.5102056868682898e-05 } }, { "step": 3033088, "logs": { "loss": 0.6866, "epoch": 2.9205175600739373, "learning_rate": 1.5062728595587369e-05 } }, { "step": 3052288, "logs": { "loss": 0.6863, "epoch": 2.9390018484288354, "learning_rate": 1.502340032249184e-05 } }, { "step": 3071488, "logs": { "loss": 0.6903, "epoch": 2.957486136783734, "learning_rate": 1.4984072049396311e-05 } }, { "step": 3090688, "logs": { "loss": 0.686, "epoch": 2.975970425138632, "learning_rate": 1.4944743776300784e-05 } }, { "step": 3109888, "logs": { "loss": 0.6909, "epoch": 2.9944547134935307, "learning_rate": 1.4905415503205256e-05 } }, { "step": 3128832, "logs": { "loss": 0.5832, "epoch": 3.0129390018484288, "learning_rate": 1.4866087230109727e-05 } }, { "step": 3148032, "logs": { "loss": 0.5314, "epoch": 3.0314232902033273, "learning_rate": 1.4826758957014197e-05 } }, { "step": 3167232, "logs": { "loss": 0.5332, "epoch": 3.0499075785582255, "learning_rate": 1.4787430683918671e-05 } }, { "step": 3186432, "logs": { "loss": 0.5359, "epoch": 3.068391866913124, "learning_rate": 1.4748102410823142e-05 } }, { "step": 3205632, "logs": { "loss": 0.5398, "epoch": 3.086876155268022, "learning_rate": 1.4708774137727613e-05 } }, { "step": 3224832, "logs": { "loss": 0.5433, "epoch": 3.1053604436229203, "learning_rate": 1.4669445864632087e-05 } }, { "step": 3244032, "logs": { "loss": 0.5368, "epoch": 3.123844731977819, "learning_rate": 1.4630117591536557e-05 } }, { "step": 3263232, "logs": { "loss": 0.5419, "epoch": 3.142329020332717, "learning_rate": 1.4590789318441028e-05 } }, { "step": 3282432, "logs": { "loss": 0.5398, "epoch": 3.1608133086876156, "learning_rate": 1.45514610453455e-05 } }, { "step": 3301632, "logs": { "loss": 0.5442, "epoch": 3.1792975970425137, "learning_rate": 1.4512132772249972e-05 } }, { "step": 3320832, "logs": { "loss": 0.544, "epoch": 3.1977818853974123, "learning_rate": 1.4472804499154443e-05 } }, { "step": 3340032, "logs": { "loss": 0.5455, "epoch": 3.2162661737523104, "learning_rate": 1.4433476226058915e-05 } }, { "step": 3359232, "logs": { "loss": 0.548, "epoch": 3.234750462107209, "learning_rate": 1.4394147952963386e-05 } }, { "step": 3378432, "logs": { "loss": 0.5453, "epoch": 3.253234750462107, "learning_rate": 1.4354819679867858e-05 } }, { "step": 3397632, "logs": { "loss": 0.5416, "epoch": 3.2717190388170057, "learning_rate": 1.431549140677233e-05 } }, { "step": 3416832, "logs": { "loss": 0.5542, "epoch": 3.290203327171904, "learning_rate": 1.4276163133676801e-05 } }, { "step": 3436032, "logs": { "loss": 0.5469, "epoch": 3.3086876155268024, "learning_rate": 1.4236834860581272e-05 } }, { "step": 3455232, "logs": { "loss": 0.5545, "epoch": 3.3271719038817005, "learning_rate": 1.4197506587485746e-05 } }, { "step": 3474432, "logs": { "loss": 0.5538, "epoch": 3.345656192236599, "learning_rate": 1.4158178314390216e-05 } }, { "step": 3493632, "logs": { "loss": 0.5504, "epoch": 3.364140480591497, "learning_rate": 1.4118850041294687e-05 } }, { "step": 3512832, "logs": { "loss": 0.5511, "epoch": 3.3826247689463957, "learning_rate": 1.4079521768199161e-05 } }, { "step": 3532032, "logs": { "loss": 0.554, "epoch": 3.401109057301294, "learning_rate": 1.4040193495103632e-05 } }, { "step": 3551232, "logs": { "loss": 0.5541, "epoch": 3.4195933456561924, "learning_rate": 1.4000865222008102e-05 } }, { "step": 3570432, "logs": { "loss": 0.5502, "epoch": 3.4380776340110906, "learning_rate": 1.3961536948912575e-05 } }, { "step": 3589632, "logs": { "loss": 0.5513, "epoch": 3.4565619223659887, "learning_rate": 1.3922208675817047e-05 } }, { "step": 3608832, "logs": { "loss": 0.5579, "epoch": 3.4750462107208873, "learning_rate": 1.3882880402721517e-05 } }, { "step": 3628032, "logs": { "loss": 0.5636, "epoch": 3.4935304990757854, "learning_rate": 1.384355212962599e-05 } }, { "step": 3647232, "logs": { "loss": 0.5617, "epoch": 3.512014787430684, "learning_rate": 1.380422385653046e-05 } }, { "step": 3666432, "logs": { "loss": 0.5549, "epoch": 3.530499075785582, "learning_rate": 1.3764895583434933e-05 } }, { "step": 3685632, "logs": { "loss": 0.5599, "epoch": 3.5489833641404807, "learning_rate": 1.3725567310339405e-05 } }, { "step": 3704832, "logs": { "loss": 0.5565, "epoch": 3.567467652495379, "learning_rate": 1.3686239037243876e-05 } }, { "step": 3724032, "logs": { "loss": 0.5565, "epoch": 3.5859519408502774, "learning_rate": 1.3646910764148346e-05 } }, { "step": 3743232, "logs": { "loss": 0.5558, "epoch": 3.6044362292051755, "learning_rate": 1.360758249105282e-05 } }, { "step": 3762432, "logs": { "loss": 0.5599, "epoch": 3.622920517560074, "learning_rate": 1.356825421795729e-05 } }, { "step": 3781632, "logs": { "loss": 0.561, "epoch": 3.641404805914972, "learning_rate": 1.3528925944861761e-05 } }, { "step": 3800832, "logs": { "loss": 0.5596, "epoch": 3.6598890942698707, "learning_rate": 1.3489597671766235e-05 } }, { "step": 3820032, "logs": { "loss": 0.5596, "epoch": 3.678373382624769, "learning_rate": 1.3450269398670706e-05 } }, { "step": 3839232, "logs": { "loss": 0.5579, "epoch": 3.6968576709796674, "learning_rate": 1.3410941125575177e-05 } }, { "step": 3858432, "logs": { "loss": 0.5611, "epoch": 3.7153419593345656, "learning_rate": 1.3371612852479649e-05 } }, { "step": 3877632, "logs": { "loss": 0.5627, "epoch": 3.733826247689464, "learning_rate": 1.3332284579384121e-05 } }, { "step": 3896832, "logs": { "loss": 0.5613, "epoch": 3.7523105360443623, "learning_rate": 1.3292956306288592e-05 } }, { "step": 3916032, "logs": { "loss": 0.5607, "epoch": 3.770794824399261, "learning_rate": 1.3253628033193064e-05 } }, { "step": 3935232, "logs": { "loss": 0.5651, "epoch": 3.789279112754159, "learning_rate": 1.3214299760097535e-05 } }, { "step": 3954432, "logs": { "loss": 0.5604, "epoch": 3.807763401109057, "learning_rate": 1.3174971487002005e-05 } }, { "step": 3973632, "logs": { "loss": 0.5676, "epoch": 3.8262476894639557, "learning_rate": 1.313564321390648e-05 } }, { "step": 3992832, "logs": { "loss": 0.5601, "epoch": 3.844731977818854, "learning_rate": 1.309631494081095e-05 } }, { "step": 4012032, "logs": { "loss": 0.5645, "epoch": 3.8632162661737524, "learning_rate": 1.305698666771542e-05 } }, { "step": 4031232, "logs": { "loss": 0.5653, "epoch": 3.8817005545286505, "learning_rate": 1.3017658394619895e-05 } }, { "step": 4050432, "logs": { "loss": 0.5618, "epoch": 3.900184842883549, "learning_rate": 1.2978330121524365e-05 } }, { "step": 4069632, "logs": { "loss": 0.5624, "epoch": 3.918669131238447, "learning_rate": 1.2939001848428836e-05 } }, { "step": 4088832, "logs": { "loss": 0.5621, "epoch": 3.9371534195933457, "learning_rate": 1.289967357533331e-05 } }, { "step": 4108032, "logs": { "loss": 0.5633, "epoch": 3.955637707948244, "learning_rate": 1.286034530223778e-05 } }, { "step": 4127232, "logs": { "loss": 0.5645, "epoch": 3.9741219963031424, "learning_rate": 1.2821017029142251e-05 } }, { "step": 4146432, "logs": { "loss": 0.5675, "epoch": 3.9926062846580406, "learning_rate": 1.2781688756046723e-05 } }, { "step": 4165376, "logs": { "loss": 0.4943, "epoch": 4.011090573012939, "learning_rate": 1.2742360482951194e-05 } }, { "step": 4184576, "logs": { "loss": 0.4282, "epoch": 4.029574861367838, "learning_rate": 1.2703032209855666e-05 } }, { "step": 4203776, "logs": { "loss": 0.4285, "epoch": 4.048059149722736, "learning_rate": 1.2663703936760139e-05 } }, { "step": 4222976, "logs": { "loss": 0.4307, "epoch": 4.066543438077634, "learning_rate": 1.262437566366461e-05 } }, { "step": 4242176, "logs": { "loss": 0.4372, "epoch": 4.085027726432532, "learning_rate": 1.258504739056908e-05 } }, { "step": 4261376, "logs": { "loss": 0.4377, "epoch": 4.103512014787431, "learning_rate": 1.2545719117473554e-05 } }, { "step": 4280576, "logs": { "loss": 0.4296, "epoch": 4.121996303142329, "learning_rate": 1.2506390844378025e-05 } }, { "step": 4299776, "logs": { "loss": 0.4358, "epoch": 4.140480591497227, "learning_rate": 1.2467062571282495e-05 } }, { "step": 4318976, "logs": { "loss": 0.4383, "epoch": 4.1589648798521255, "learning_rate": 1.2427734298186969e-05 } }, { "step": 4338176, "logs": { "loss": 0.4355, "epoch": 4.177449168207024, "learning_rate": 1.238840602509144e-05 } }, { "step": 4357376, "logs": { "loss": 0.44, "epoch": 4.195933456561923, "learning_rate": 1.234907775199591e-05 } }, { "step": 4376576, "logs": { "loss": 0.4393, "epoch": 4.214417744916821, "learning_rate": 1.2309749478900384e-05 } }, { "step": 4395776, "logs": { "loss": 0.4427, "epoch": 4.232902033271719, "learning_rate": 1.2270421205804855e-05 } }, { "step": 4414976, "logs": { "loss": 0.4399, "epoch": 4.251386321626617, "learning_rate": 1.2231092932709326e-05 } }, { "step": 4434176, "logs": { "loss": 0.4401, "epoch": 4.269870609981516, "learning_rate": 1.2191764659613798e-05 } }, { "step": 4453376, "logs": { "loss": 0.4446, "epoch": 4.288354898336414, "learning_rate": 1.2152436386518269e-05 } }, { "step": 4472576, "logs": { "loss": 0.4436, "epoch": 4.306839186691312, "learning_rate": 1.211310811342274e-05 } }, { "step": 4491776, "logs": { "loss": 0.4478, "epoch": 4.32532347504621, "learning_rate": 1.2073779840327213e-05 } }, { "step": 4510976, "logs": { "loss": 0.447, "epoch": 4.343807763401109, "learning_rate": 1.2034451567231684e-05 } }, { "step": 4530176, "logs": { "loss": 0.4505, "epoch": 4.3622920517560075, "learning_rate": 1.1995123294136154e-05 } }, { "step": 4549376, "logs": { "loss": 0.4461, "epoch": 4.380776340110906, "learning_rate": 1.1955795021040628e-05 } }, { "step": 4568576, "logs": { "loss": 0.4511, "epoch": 4.399260628465804, "learning_rate": 1.1916466747945099e-05 } }, { "step": 4587776, "logs": { "loss": 0.4481, "epoch": 4.417744916820703, "learning_rate": 1.187713847484957e-05 } }, { "step": 4606976, "logs": { "loss": 0.4457, "epoch": 4.436229205175601, "learning_rate": 1.1837810201754044e-05 } }, { "step": 4626176, "logs": { "loss": 0.4491, "epoch": 4.454713493530499, "learning_rate": 1.1798481928658514e-05 } }, { "step": 4645376, "logs": { "loss": 0.453, "epoch": 4.473197781885397, "learning_rate": 1.1759153655562985e-05 } }, { "step": 4664576, "logs": { "loss": 0.4557, "epoch": 4.491682070240295, "learning_rate": 1.1719825382467455e-05 } }, { "step": 4683776, "logs": { "loss": 0.4588, "epoch": 4.510166358595194, "learning_rate": 1.168049710937193e-05 } }, { "step": 4702976, "logs": { "loss": 0.4478, "epoch": 4.5286506469500925, "learning_rate": 1.16411688362764e-05 } }, { "step": 4722176, "logs": { "loss": 0.4558, "epoch": 4.547134935304991, "learning_rate": 1.160184056318087e-05 } }, { "step": 4741376, "logs": { "loss": 0.453, "epoch": 4.565619223659889, "learning_rate": 1.1562512290085343e-05 } }, { "step": 4760576, "logs": { "loss": 0.4566, "epoch": 4.584103512014788, "learning_rate": 1.1523184016989815e-05 } }, { "step": 4779776, "logs": { "loss": 0.4512, "epoch": 4.602587800369686, "learning_rate": 1.1483855743894286e-05 } }, { "step": 4798976, "logs": { "loss": 0.4537, "epoch": 4.621072088724584, "learning_rate": 1.1444527470798758e-05 } }, { "step": 4818176, "logs": { "loss": 0.4596, "epoch": 4.639556377079482, "learning_rate": 1.1405199197703229e-05 } }, { "step": 4837376, "logs": { "loss": 0.4544, "epoch": 4.658040665434381, "learning_rate": 1.1365870924607701e-05 } }, { "step": 4856576, "logs": { "loss": 0.4552, "epoch": 4.676524953789279, "learning_rate": 1.1326542651512173e-05 } }, { "step": 4875776, "logs": { "loss": 0.4561, "epoch": 4.695009242144177, "learning_rate": 1.1287214378416644e-05 } }, { "step": 4894976, "logs": { "loss": 0.456, "epoch": 4.7134935304990755, "learning_rate": 1.1247886105321115e-05 } }, { "step": 4914176, "logs": { "loss": 0.455, "epoch": 4.7319778188539745, "learning_rate": 1.1208557832225589e-05 } }, { "step": 4933376, "logs": { "loss": 0.4579, "epoch": 4.750462107208873, "learning_rate": 1.116922955913006e-05 } }, { "step": 4952576, "logs": { "loss": 0.4569, "epoch": 4.768946395563771, "learning_rate": 1.112990128603453e-05 } }, { "step": 4971776, "logs": { "loss": 0.459, "epoch": 4.787430683918669, "learning_rate": 1.1090573012939004e-05 } }, { "step": 4990976, "logs": { "loss": 0.456, "epoch": 4.805914972273568, "learning_rate": 1.1051244739843475e-05 } }, { "step": 5010176, "logs": { "loss": 0.4605, "epoch": 4.824399260628466, "learning_rate": 1.1011916466747945e-05 } }, { "step": 5029376, "logs": { "loss": 0.4565, "epoch": 4.842883548983364, "learning_rate": 1.0972588193652417e-05 } }, { "step": 5048576, "logs": { "loss": 0.4606, "epoch": 4.861367837338262, "learning_rate": 1.093325992055689e-05 } }, { "step": 5067776, "logs": { "loss": 0.4586, "epoch": 4.87985212569316, "learning_rate": 1.089393164746136e-05 } }, { "step": 5086976, "logs": { "loss": 0.4605, "epoch": 4.898336414048059, "learning_rate": 1.0854603374365833e-05 } }, { "step": 5106176, "logs": { "loss": 0.4565, "epoch": 4.9168207024029575, "learning_rate": 1.0815275101270303e-05 } }, { "step": 5125376, "logs": { "loss": 0.4585, "epoch": 4.935304990757856, "learning_rate": 1.0775946828174776e-05 } }, { "step": 5144576, "logs": { "loss": 0.4588, "epoch": 4.953789279112754, "learning_rate": 1.0736618555079248e-05 } }, { "step": 5163776, "logs": { "loss": 0.4639, "epoch": 4.972273567467653, "learning_rate": 1.0697290281983718e-05 } }, { "step": 5182976, "logs": { "loss": 0.4666, "epoch": 4.990757855822551, "learning_rate": 1.0657962008888189e-05 } }, { "step": 5201920, "logs": { "loss": 0.4109, "epoch": 5.009242144177449, "learning_rate": 1.0618633735792663e-05 } }, { "step": 5221120, "logs": { "loss": 0.3538, "epoch": 5.027726432532347, "learning_rate": 1.0579305462697134e-05 } }, { "step": 5240320, "logs": { "loss": 0.346, "epoch": 5.046210720887246, "learning_rate": 1.0539977189601604e-05 } }, { "step": 5259520, "logs": { "loss": 0.3483, "epoch": 5.064695009242144, "learning_rate": 1.0500648916506078e-05 } }, { "step": 5278720, "logs": { "loss": 0.3548, "epoch": 5.0831792975970425, "learning_rate": 1.0461320643410549e-05 } }, { "step": 5297920, "logs": { "loss": 0.3567, "epoch": 5.101663585951941, "learning_rate": 1.042199237031502e-05 } }, { "step": 5317120, "logs": { "loss": 0.3525, "epoch": 5.12014787430684, "learning_rate": 1.0382664097219492e-05 } }, { "step": 5336320, "logs": { "loss": 0.3563, "epoch": 5.138632162661738, "learning_rate": 1.0343335824123964e-05 } }, { "step": 5355520, "logs": { "loss": 0.3606, "epoch": 5.157116451016636, "learning_rate": 1.0304007551028435e-05 } }, { "step": 5374720, "logs": { "loss": 0.3585, "epoch": 5.175600739371534, "learning_rate": 1.0264679277932907e-05 } }, { "step": 5393920, "logs": { "loss": 0.3547, "epoch": 5.194085027726432, "learning_rate": 1.0225351004837378e-05 } }, { "step": 5413120, "logs": { "loss": 0.359, "epoch": 5.212569316081331, "learning_rate": 1.018602273174185e-05 } }, { "step": 5432320, "logs": { "loss": 0.3616, "epoch": 5.231053604436229, "learning_rate": 1.0146694458646322e-05 } }, { "step": 5451520, "logs": { "loss": 0.3602, "epoch": 5.249537892791127, "learning_rate": 1.0107366185550793e-05 } }, { "step": 5470720, "logs": { "loss": 0.3607, "epoch": 5.2680221811460255, "learning_rate": 1.0068037912455264e-05 } }, { "step": 5489920, "logs": { "loss": 0.3642, "epoch": 5.2865064695009245, "learning_rate": 1.0028709639359738e-05 } }, { "step": 5509120, "logs": { "loss": 0.3616, "epoch": 5.304990757855823, "learning_rate": 9.989381366264208e-06 } }, { "step": 5528320, "logs": { "loss": 0.364, "epoch": 5.323475046210721, "learning_rate": 9.95005309316868e-06 } }, { "step": 5547520, "logs": { "loss": 0.3656, "epoch": 5.341959334565619, "learning_rate": 9.910724820073151e-06 } }, { "step": 5566720, "logs": { "loss": 0.3613, "epoch": 5.360443622920518, "learning_rate": 9.871396546977623e-06 } }, { "step": 5585920, "logs": { "loss": 0.3655, "epoch": 5.378927911275416, "learning_rate": 9.832068273882096e-06 } }, { "step": 5605120, "logs": { "loss": 0.3677, "epoch": 5.397412199630314, "learning_rate": 9.792740000786566e-06 } }, { "step": 5624320, "logs": { "loss": 0.3678, "epoch": 5.415896487985212, "learning_rate": 9.753411727691039e-06 } }, { "step": 5643520, "logs": { "loss": 0.364, "epoch": 5.434380776340111, "learning_rate": 9.71408345459551e-06 } }, { "step": 5662720, "logs": { "loss": 0.3654, "epoch": 5.452865064695009, "learning_rate": 9.67475518149998e-06 } }, { "step": 5681920, "logs": { "loss": 0.3671, "epoch": 5.4713493530499075, "learning_rate": 9.635426908404452e-06 } }, { "step": 5701120, "logs": { "loss": 0.3724, "epoch": 5.489833641404806, "learning_rate": 9.596098635308924e-06 } }, { "step": 5720320, "logs": { "loss": 1.4537, "epoch": 5.508317929759705, "learning_rate": 9.556770362213395e-06 } }, { "step": 5739520, "logs": { "loss": 0.3685, "epoch": 5.526802218114603, "learning_rate": 9.517442089117867e-06 } }, { "step": 5758720, "logs": { "loss": 0.3688, "epoch": 5.545286506469501, "learning_rate": 9.47811381602234e-06 } }, { "step": 5777920, "logs": { "loss": 0.3726, "epoch": 5.563770794824399, "learning_rate": 9.43878554292681e-06 } }, { "step": 5797120, "logs": { "loss": 0.3718, "epoch": 5.582255083179297, "learning_rate": 9.399457269831283e-06 } }, { "step": 5816320, "logs": { "loss": 0.3691, "epoch": 5.600739371534196, "learning_rate": 9.360128996735755e-06 } }, { "step": 5835520, "logs": { "loss": 0.3684, "epoch": 5.619223659889094, "learning_rate": 9.320800723640226e-06 } }, { "step": 5854720, "logs": { "loss": 0.3747, "epoch": 5.6377079482439925, "learning_rate": 9.281472450544698e-06 } }, { "step": 5873920, "logs": { "loss": 0.3727, "epoch": 5.656192236598891, "learning_rate": 9.24214417744917e-06 } }, { "step": 5893120, "logs": { "loss": 0.3736, "epoch": 5.67467652495379, "learning_rate": 9.20281590435364e-06 } }, { "step": 5912320, "logs": { "loss": 0.3725, "epoch": 5.693160813308688, "learning_rate": 9.163487631258111e-06 } }, { "step": 5931520, "logs": { "loss": 0.3711, "epoch": 5.711645101663586, "learning_rate": 9.124159358162584e-06 } }, { "step": 5950720, "logs": { "loss": 0.3705, "epoch": 5.730129390018484, "learning_rate": 9.084831085067054e-06 } }, { "step": 5969920, "logs": { "loss": 0.3698, "epoch": 5.748613678373383, "learning_rate": 9.045502811971527e-06 } }, { "step": 5989120, "logs": { "loss": 0.3725, "epoch": 5.767097966728281, "learning_rate": 9.006174538875999e-06 } }, { "step": 6008320, "logs": { "loss": 0.3767, "epoch": 5.785582255083179, "learning_rate": 8.96684626578047e-06 } }, { "step": 6027520, "logs": { "loss": 0.3696, "epoch": 5.804066543438077, "learning_rate": 8.927517992684942e-06 } }, { "step": 6046720, "logs": { "loss": 0.3797, "epoch": 5.822550831792976, "learning_rate": 8.888189719589414e-06 } }, { "step": 6065920, "logs": { "loss": 0.371, "epoch": 5.8410351201478745, "learning_rate": 8.848861446493885e-06 } }, { "step": 6085120, "logs": { "loss": 0.3769, "epoch": 5.859519408502773, "learning_rate": 8.809533173398357e-06 } }, { "step": 6104320, "logs": { "loss": 0.3731, "epoch": 5.878003696857671, "learning_rate": 8.77020490030283e-06 } }, { "step": 6123520, "logs": { "loss": 0.3769, "epoch": 5.896487985212569, "learning_rate": 8.7308766272073e-06 } }, { "step": 6142720, "logs": { "loss": 0.3711, "epoch": 5.914972273567468, "learning_rate": 8.691548354111772e-06 } }, { "step": 6161920, "logs": { "loss": 0.3752, "epoch": 5.933456561922366, "learning_rate": 8.652220081016243e-06 } }, { "step": 6181120, "logs": { "loss": 0.3697, "epoch": 5.951940850277264, "learning_rate": 8.612891807920715e-06 } }, { "step": 6200320, "logs": { "loss": 0.3751, "epoch": 5.970425138632162, "learning_rate": 8.573563534825186e-06 } }, { "step": 6219520, "logs": { "loss": 0.3791, "epoch": 5.988909426987061, "learning_rate": 8.534235261729658e-06 } }, { "step": 6238464, "logs": { "loss": 0.3443, "epoch": 6.007393715341959, "learning_rate": 8.494906988634129e-06 } }, { "step": 6257664, "logs": { "loss": 0.2903, "epoch": 6.0258780036968576, "learning_rate": 8.455578715538601e-06 } }, { "step": 6276864, "logs": { "loss": 0.2906, "epoch": 6.044362292051756, "learning_rate": 8.416250442443073e-06 } }, { "step": 6296064, "logs": { "loss": 0.2884, "epoch": 6.062846580406655, "learning_rate": 8.376922169347544e-06 } }, { "step": 6315264, "logs": { "loss": 0.2913, "epoch": 6.081330868761553, "learning_rate": 8.337593896252016e-06 } }, { "step": 6334464, "logs": { "loss": 0.2964, "epoch": 6.099815157116451, "learning_rate": 8.298265623156489e-06 } }, { "step": 6353664, "logs": { "loss": 0.2877, "epoch": 6.118299445471349, "learning_rate": 8.25893735006096e-06 } }, { "step": 6372864, "logs": { "loss": 0.2957, "epoch": 6.136783733826248, "learning_rate": 8.219609076965432e-06 } }, { "step": 6392064, "logs": { "loss": 0.2974, "epoch": 6.155268022181146, "learning_rate": 8.180280803869902e-06 } }, { "step": 6411264, "logs": { "loss": 0.295, "epoch": 6.173752310536044, "learning_rate": 8.140952530774374e-06 } }, { "step": 6430464, "logs": { "loss": 0.2947, "epoch": 6.1922365988909425, "learning_rate": 8.101624257678847e-06 } }, { "step": 6449664, "logs": { "loss": 0.2957, "epoch": 6.210720887245841, "learning_rate": 8.062295984583317e-06 } }, { "step": 6468864, "logs": { "loss": 0.3001, "epoch": 6.22920517560074, "learning_rate": 8.02296771148779e-06 } }, { "step": 6488064, "logs": { "loss": 0.2958, "epoch": 6.247689463955638, "learning_rate": 7.98363943839226e-06 } }, { "step": 6507264, "logs": { "loss": 0.2956, "epoch": 6.266173752310536, "learning_rate": 7.944311165296733e-06 } }, { "step": 6526464, "logs": { "loss": 0.3, "epoch": 6.284658040665434, "learning_rate": 7.904982892201203e-06 } }, { "step": 6545664, "logs": { "loss": 0.3, "epoch": 6.303142329020333, "learning_rate": 7.865654619105676e-06 } }, { "step": 6564864, "logs": { "loss": 0.3003, "epoch": 6.321626617375231, "learning_rate": 7.826326346010146e-06 } }, { "step": 6584064, "logs": { "loss": 0.3029, "epoch": 6.340110905730129, "learning_rate": 7.786998072914618e-06 } }, { "step": 6603264, "logs": { "loss": 0.301, "epoch": 6.358595194085027, "learning_rate": 7.74766979981909e-06 } }, { "step": 6622464, "logs": { "loss": 0.297, "epoch": 6.377079482439926, "learning_rate": 7.708341526723561e-06 } }, { "step": 6641664, "logs": { "loss": 0.2993, "epoch": 6.3955637707948245, "learning_rate": 7.669013253628034e-06 } }, { "step": 6660864, "logs": { "loss": 0.3035, "epoch": 6.414048059149723, "learning_rate": 7.629684980532506e-06 } }, { "step": 6680064, "logs": { "loss": 0.2988, "epoch": 6.432532347504621, "learning_rate": 7.590356707436977e-06 } }, { "step": 6699264, "logs": { "loss": 0.3001, "epoch": 6.45101663585952, "learning_rate": 7.551028434341449e-06 } }, { "step": 6718464, "logs": { "loss": 0.3024, "epoch": 6.469500924214418, "learning_rate": 7.51170016124592e-06 } }, { "step": 6737664, "logs": { "loss": 0.3053, "epoch": 6.487985212569316, "learning_rate": 7.472371888150392e-06 } }, { "step": 6756864, "logs": { "loss": 0.3081, "epoch": 6.506469500924214, "learning_rate": 7.433043615054863e-06 } }, { "step": 6776064, "logs": { "loss": 0.3002, "epoch": 6.524953789279113, "learning_rate": 7.393715341959336e-06 } }, { "step": 6795264, "logs": { "loss": 0.3044, "epoch": 6.543438077634011, "learning_rate": 7.354387068863806e-06 } }, { "step": 6814464, "logs": { "loss": 0.3016, "epoch": 6.561922365988909, "learning_rate": 7.3150587957682786e-06 } }, { "step": 6833664, "logs": { "loss": 0.3071, "epoch": 6.580406654343808, "learning_rate": 7.27573052267275e-06 } }, { "step": 6852864, "logs": { "loss": 0.3002, "epoch": 6.598890942698706, "learning_rate": 7.2364022495772215e-06 } }, { "step": 6872064, "logs": { "loss": 0.3042, "epoch": 6.617375231053605, "learning_rate": 7.197073976481693e-06 } }, { "step": 6891264, "logs": { "loss": 0.3042, "epoch": 6.635859519408503, "learning_rate": 7.157745703386165e-06 } }, { "step": 6910464, "logs": { "loss": 0.3063, "epoch": 6.654343807763401, "learning_rate": 7.118417430290636e-06 } }, { "step": 6929664, "logs": { "loss": 0.3031, "epoch": 6.672828096118299, "learning_rate": 7.079089157195108e-06 } }, { "step": 6948864, "logs": { "loss": 0.3081, "epoch": 6.691312384473198, "learning_rate": 7.0397608840995805e-06 } }, { "step": 6968064, "logs": { "loss": 0.3041, "epoch": 6.709796672828096, "learning_rate": 7.000432611004051e-06 } }, { "step": 6987264, "logs": { "loss": 0.3036, "epoch": 6.728280961182994, "learning_rate": 6.961104337908523e-06 } }, { "step": 7006464, "logs": { "loss": 0.3044, "epoch": 6.7467652495378925, "learning_rate": 6.921776064812995e-06 } }, { "step": 7025664, "logs": { "loss": 0.3057, "epoch": 6.7652495378927915, "learning_rate": 6.882447791717466e-06 } }, { "step": 7044864, "logs": { "loss": 0.3081, "epoch": 6.78373382624769, "learning_rate": 6.843119518621938e-06 } }, { "step": 7064064, "logs": { "loss": 0.3058, "epoch": 6.802218114602588, "learning_rate": 6.80379124552641e-06 } }, { "step": 7083264, "logs": { "loss": 0.3072, "epoch": 6.820702402957486, "learning_rate": 6.764462972430881e-06 } }, { "step": 7102464, "logs": { "loss": 0.3042, "epoch": 6.839186691312385, "learning_rate": 6.725134699335353e-06 } }, { "step": 7121664, "logs": { "loss": 0.3091, "epoch": 6.857670979667283, "learning_rate": 6.6858064262398245e-06 } }, { "step": 7140864, "logs": { "loss": 0.3036, "epoch": 6.876155268022181, "learning_rate": 6.646478153144296e-06 } }, { "step": 7160064, "logs": { "loss": 0.3081, "epoch": 6.894639556377079, "learning_rate": 6.607149880048767e-06 } }, { "step": 7179264, "logs": { "loss": 0.3018, "epoch": 6.913123844731977, "learning_rate": 6.56782160695324e-06 } }, { "step": 7198464, "logs": { "loss": 0.3055, "epoch": 6.931608133086876, "learning_rate": 6.52849333385771e-06 } }, { "step": 7217664, "logs": { "loss": 0.3046, "epoch": 6.9500924214417745, "learning_rate": 6.489165060762183e-06 } }, { "step": 7236864, "logs": { "loss": 0.3083, "epoch": 6.968576709796673, "learning_rate": 6.449836787666655e-06 } }, { "step": 7256064, "logs": { "loss": 0.3118, "epoch": 6.987060998151571, "learning_rate": 6.4105085145711256e-06 } }, { "step": 7275008, "logs": { "loss": 0.2902, "epoch": 7.00554528650647, "learning_rate": 6.371180241475597e-06 } }, { "step": 7294208, "logs": { "loss": 0.241, "epoch": 7.024029574861368, "learning_rate": 6.331851968380069e-06 } }, { "step": 7313408, "logs": { "loss": 0.2432, "epoch": 7.042513863216266, "learning_rate": 6.29252369528454e-06 } }, { "step": 7332608, "logs": { "loss": 0.2405, "epoch": 7.060998151571164, "learning_rate": 6.253195422189012e-06 } }, { "step": 7351808, "logs": { "loss": 0.2447, "epoch": 7.079482439926063, "learning_rate": 6.2138671490934846e-06 } }, { "step": 7371008, "logs": { "loss": 0.2458, "epoch": 7.097966728280961, "learning_rate": 6.174538875997955e-06 } }, { "step": 7390208, "logs": { "loss": 0.2414, "epoch": 7.116451016635859, "learning_rate": 6.1352106029024275e-06 } }, { "step": 7409408, "logs": { "loss": 0.2465, "epoch": 7.134935304990758, "learning_rate": 6.095882329806899e-06 } }, { "step": 7428608, "logs": { "loss": 0.2474, "epoch": 7.153419593345657, "learning_rate": 6.05655405671137e-06 } }, { "step": 7447808, "logs": { "loss": 0.2464, "epoch": 7.171903881700555, "learning_rate": 6.017225783615842e-06 } }, { "step": 7467008, "logs": { "loss": 0.2443, "epoch": 7.190388170055453, "learning_rate": 5.977897510520314e-06 } }, { "step": 7486208, "logs": { "loss": 0.2466, "epoch": 7.208872458410351, "learning_rate": 5.938569237424785e-06 } }, { "step": 7505408, "logs": { "loss": 0.2497, "epoch": 7.22735674676525, "learning_rate": 5.899240964329257e-06 } }, { "step": 7524608, "logs": { "loss": 0.2469, "epoch": 7.245841035120148, "learning_rate": 5.859912691233728e-06 } }, { "step": 7543808, "logs": { "loss": 0.2468, "epoch": 7.264325323475046, "learning_rate": 5.8205844181382e-06 } }, { "step": 7563008, "logs": { "loss": 0.2495, "epoch": 7.282809611829944, "learning_rate": 5.7812561450426715e-06 } }, { "step": 7582208, "logs": { "loss": 0.2496, "epoch": 7.3012939001848425, "learning_rate": 5.741927871947143e-06 } }, { "step": 7601408, "logs": { "loss": 0.2516, "epoch": 7.3197781885397415, "learning_rate": 5.702599598851614e-06 } }, { "step": 7620608, "logs": { "loss": 0.2516, "epoch": 7.33826247689464, "learning_rate": 5.663271325756087e-06 } }, { "step": 7639808, "logs": { "loss": 0.2493, "epoch": 7.356746765249538, "learning_rate": 5.623943052660557e-06 } }, { "step": 7659008, "logs": { "loss": 0.2458, "epoch": 7.375231053604436, "learning_rate": 5.58461477956503e-06 } }, { "step": 7678208, "logs": { "loss": 0.2494, "epoch": 7.393715341959335, "learning_rate": 5.545286506469502e-06 } }, { "step": 7697408, "logs": { "loss": 0.2534, "epoch": 7.412199630314233, "learning_rate": 5.5059582333739726e-06 } }, { "step": 7716608, "logs": { "loss": 0.2499, "epoch": 7.430683918669131, "learning_rate": 5.466629960278445e-06 } }, { "step": 7735808, "logs": { "loss": 0.249, "epoch": 7.449168207024029, "learning_rate": 5.427301687182916e-06 } }, { "step": 7755008, "logs": { "loss": 0.2498, "epoch": 7.467652495378928, "learning_rate": 5.387973414087388e-06 } }, { "step": 7774208, "logs": { "loss": 0.2541, "epoch": 7.486136783733826, "learning_rate": 5.348645140991859e-06 } }, { "step": 7793408, "logs": { "loss": 0.2579, "epoch": 7.5046210720887245, "learning_rate": 5.3093168678963316e-06 } }, { "step": 7812608, "logs": { "loss": 0.2476, "epoch": 7.523105360443623, "learning_rate": 5.269988594800802e-06 } }, { "step": 7831808, "logs": { "loss": 0.2538, "epoch": 7.541589648798522, "learning_rate": 5.2306603217052745e-06 } }, { "step": 7851008, "logs": { "loss": 0.2537, "epoch": 7.56007393715342, "learning_rate": 5.191332048609746e-06 } }, { "step": 7870208, "logs": { "loss": 0.2522, "epoch": 7.578558225508318, "learning_rate": 5.152003775514217e-06 } }, { "step": 7889408, "logs": { "loss": 0.2491, "epoch": 7.597042513863216, "learning_rate": 5.112675502418689e-06 } }, { "step": 7908608, "logs": { "loss": 0.2509, "epoch": 7.615526802218114, "learning_rate": 5.073347229323161e-06 } }, { "step": 7927808, "logs": { "loss": 0.2496, "epoch": 7.634011090573013, "learning_rate": 5.034018956227632e-06 } }, { "step": 7947008, "logs": { "loss": 0.2542, "epoch": 7.652495378927911, "learning_rate": 4.994690683132104e-06 } }, { "step": 7966208, "logs": { "loss": 0.2517, "epoch": 7.6709796672828094, "learning_rate": 4.9553624100365756e-06 } }, { "step": 7985408, "logs": { "loss": 0.2544, "epoch": 7.689463955637708, "learning_rate": 4.916034136941048e-06 } }, { "step": 8004608, "logs": { "loss": 0.2489, "epoch": 7.707948243992607, "learning_rate": 4.876705863845519e-06 } }, { "step": 8023808, "logs": { "loss": 0.2506, "epoch": 7.726432532347505, "learning_rate": 4.83737759074999e-06 } }, { "step": 8043008, "logs": { "loss": 0.2535, "epoch": 7.744916820702403, "learning_rate": 4.798049317654462e-06 } }, { "step": 8062208, "logs": { "loss": 0.2506, "epoch": 7.763401109057301, "learning_rate": 4.758721044558934e-06 } }, { "step": 8081408, "logs": { "loss": 0.2547, "epoch": 7.7818853974122, "learning_rate": 4.719392771463405e-06 } }, { "step": 8100608, "logs": { "loss": 0.2525, "epoch": 7.800369685767098, "learning_rate": 4.6800644983678775e-06 } }, { "step": 8119808, "logs": { "loss": 0.2535, "epoch": 7.818853974121996, "learning_rate": 4.640736225272349e-06 } }, { "step": 8139008, "logs": { "loss": 0.2508, "epoch": 7.837338262476894, "learning_rate": 4.60140795217682e-06 } }, { "step": 8158208, "logs": { "loss": 0.254, "epoch": 7.855822550831793, "learning_rate": 4.562079679081292e-06 } }, { "step": 8177408, "logs": { "loss": 0.251, "epoch": 7.8743068391866915, "learning_rate": 4.522751405985763e-06 } }, { "step": 8196608, "logs": { "loss": 0.2545, "epoch": 7.89279112754159, "learning_rate": 4.483423132890235e-06 } }, { "step": 8215808, "logs": { "loss": 0.2497, "epoch": 7.911275415896488, "learning_rate": 4.444094859794707e-06 } }, { "step": 8235008, "logs": { "loss": 0.253, "epoch": 7.929759704251387, "learning_rate": 4.4047665866991786e-06 } }, { "step": 8254208, "logs": { "loss": 0.249, "epoch": 7.948243992606285, "learning_rate": 4.36543831360365e-06 } }, { "step": 8273408, "logs": { "loss": 0.2534, "epoch": 7.966728280961183, "learning_rate": 4.3261100405081215e-06 } }, { "step": 8292608, "logs": { "loss": 0.2563, "epoch": 7.985212569316081, "learning_rate": 4.286781767412593e-06 } }, { "step": 8311552, "logs": { "loss": 0.2489, "epoch": 8.00369685767098, "learning_rate": 4.247453494317064e-06 } }, { "step": 8330752, "logs": { "loss": 0.2079, "epoch": 8.022181146025877, "learning_rate": 4.208125221221537e-06 } }, { "step": 8349952, "logs": { "loss": 0.2079, "epoch": 8.040665434380776, "learning_rate": 4.168796948126008e-06 } }, { "step": 8369152, "logs": { "loss": 0.2055, "epoch": 8.059149722735675, "learning_rate": 4.12946867503048e-06 } }, { "step": 8388352, "logs": { "loss": 0.2115, "epoch": 8.077634011090574, "learning_rate": 4.090140401934951e-06 } }, { "step": 8407552, "logs": { "loss": 0.2105, "epoch": 8.096118299445472, "learning_rate": 4.050812128839423e-06 } }, { "step": 8426752, "logs": { "loss": 0.2055, "epoch": 8.11460258780037, "learning_rate": 4.011483855743895e-06 } }, { "step": 8445952, "logs": { "loss": 0.2086, "epoch": 8.133086876155268, "learning_rate": 3.972155582648366e-06 } }, { "step": 8465152, "logs": { "loss": 0.2102, "epoch": 8.151571164510166, "learning_rate": 3.932827309552838e-06 } }, { "step": 8484352, "logs": { "loss": 0.21, "epoch": 8.170055452865064, "learning_rate": 3.893499036457309e-06 } }, { "step": 8503552, "logs": { "loss": 0.2081, "epoch": 8.188539741219962, "learning_rate": 3.854170763361781e-06 } }, { "step": 8522752, "logs": { "loss": 0.213, "epoch": 8.207024029574862, "learning_rate": 3.814842490266253e-06 } }, { "step": 8541952, "logs": { "loss": 0.2114, "epoch": 8.22550831792976, "learning_rate": 3.7755142171707245e-06 } }, { "step": 8561152, "logs": { "loss": 0.2116, "epoch": 8.243992606284658, "learning_rate": 3.736185944075196e-06 } }, { "step": 8580352, "logs": { "loss": 0.2106, "epoch": 8.262476894639557, "learning_rate": 3.696857670979668e-06 } }, { "step": 8599552, "logs": { "loss": 0.2097, "epoch": 8.280961182994455, "learning_rate": 3.6575293978841393e-06 } }, { "step": 8618752, "logs": { "loss": 0.2119, "epoch": 8.299445471349353, "learning_rate": 3.6182011247886107e-06 } }, { "step": 8637952, "logs": { "loss": 0.2144, "epoch": 8.317929759704251, "learning_rate": 3.5788728516930826e-06 } }, { "step": 8657152, "logs": { "loss": 0.2125, "epoch": 8.336414048059149, "learning_rate": 3.539544578597554e-06 } }, { "step": 8676352, "logs": { "loss": 0.2134, "epoch": 8.354898336414047, "learning_rate": 3.5002163055020256e-06 } }, { "step": 8695552, "logs": { "loss": 0.2127, "epoch": 8.373382624768947, "learning_rate": 3.4608880324064974e-06 } }, { "step": 8714752, "logs": { "loss": 0.2111, "epoch": 8.391866913123845, "learning_rate": 3.421559759310969e-06 } }, { "step": 8733952, "logs": { "loss": 0.213, "epoch": 8.410351201478743, "learning_rate": 3.3822314862154404e-06 } }, { "step": 8753152, "logs": { "loss": 0.2109, "epoch": 8.428835489833642, "learning_rate": 3.3429032131199122e-06 } }, { "step": 8772352, "logs": { "loss": 0.2093, "epoch": 8.44731977818854, "learning_rate": 3.3035749400243837e-06 } }, { "step": 8791552, "logs": { "loss": 0.2126, "epoch": 8.465804066543438, "learning_rate": 3.264246666928855e-06 } }, { "step": 8810752, "logs": { "loss": 0.2127, "epoch": 8.484288354898336, "learning_rate": 3.2249183938333275e-06 } }, { "step": 8829952, "logs": { "loss": 0.2184, "epoch": 8.502772643253234, "learning_rate": 3.1855901207377985e-06 } }, { "step": 8849152, "logs": { "loss": 0.2108, "epoch": 8.521256931608134, "learning_rate": 3.14626184764227e-06 } }, { "step": 8868352, "logs": { "loss": 0.2123, "epoch": 8.539741219963032, "learning_rate": 3.1069335745467423e-06 } }, { "step": 8887552, "logs": { "loss": 0.2125, "epoch": 8.55822550831793, "learning_rate": 3.0676053014512137e-06 } }, { "step": 8906752, "logs": { "loss": 0.2124, "epoch": 8.576709796672828, "learning_rate": 3.028277028355685e-06 } }, { "step": 8925952, "logs": { "loss": 0.2112, "epoch": 8.595194085027726, "learning_rate": 2.988948755260157e-06 } }, { "step": 8945152, "logs": { "loss": 0.2103, "epoch": 8.613678373382625, "learning_rate": 2.9496204821646285e-06 } }, { "step": 8964352, "logs": { "loss": 0.2128, "epoch": 8.632162661737523, "learning_rate": 2.9102922090691e-06 } }, { "step": 8983552, "logs": { "loss": 0.2125, "epoch": 8.65064695009242, "learning_rate": 2.8709639359735715e-06 } }, { "step": 9002752, "logs": { "loss": 0.2109, "epoch": 8.669131238447319, "learning_rate": 2.8316356628780434e-06 } }, { "step": 9021952, "logs": { "loss": 0.2132, "epoch": 8.687615526802219, "learning_rate": 2.792307389782515e-06 } }, { "step": 9041152, "logs": { "loss": 0.2113, "epoch": 8.706099815157117, "learning_rate": 2.7529791166869863e-06 } }, { "step": 9060352, "logs": { "loss": 0.2109, "epoch": 8.724584103512015, "learning_rate": 2.713650843591458e-06 } }, { "step": 9079552, "logs": { "loss": 0.2138, "epoch": 8.743068391866913, "learning_rate": 2.6743225704959296e-06 } }, { "step": 9098752, "logs": { "loss": 0.2098, "epoch": 8.761552680221811, "learning_rate": 2.634994297400401e-06 } }, { "step": 9117952, "logs": { "loss": 0.2128, "epoch": 8.78003696857671, "learning_rate": 2.595666024304873e-06 } }, { "step": 9137152, "logs": { "loss": 0.2143, "epoch": 8.798521256931608, "learning_rate": 2.5563377512093444e-06 } }, { "step": 9156352, "logs": { "loss": 0.2132, "epoch": 8.817005545286506, "learning_rate": 2.517009478113816e-06 } }, { "step": 9175552, "logs": { "loss": 0.2099, "epoch": 8.835489833641406, "learning_rate": 2.4776812050182878e-06 } }, { "step": 9194752, "logs": { "loss": 0.2124, "epoch": 8.853974121996304, "learning_rate": 2.4383529319227597e-06 } }, { "step": 9213952, "logs": { "loss": 0.2122, "epoch": 8.872458410351202, "learning_rate": 2.399024658827231e-06 } }, { "step": 9233152, "logs": { "loss": 0.2136, "epoch": 8.8909426987061, "learning_rate": 2.3596963857317026e-06 } }, { "step": 9252352, "logs": { "loss": 0.2103, "epoch": 8.909426987060998, "learning_rate": 2.3203681126361745e-06 } }, { "step": 9271552, "logs": { "loss": 0.2132, "epoch": 8.927911275415896, "learning_rate": 2.281039839540646e-06 } }, { "step": 9290752, "logs": { "loss": 0.2082, "epoch": 8.946395563770794, "learning_rate": 2.2417115664451174e-06 } }, { "step": 9309952, "logs": { "loss": 0.213, "epoch": 8.964879852125692, "learning_rate": 2.2023832933495893e-06 } }, { "step": 9329152, "logs": { "loss": 0.2142, "epoch": 8.98336414048059, "learning_rate": 2.1630550202540607e-06 } }, { "step": 9348096, "logs": { "loss": 0.2123, "epoch": 9.00184842883549, "learning_rate": 2.123726747158532e-06 } }, { "step": 9367296, "logs": { "loss": 0.1854, "epoch": 9.020332717190389, "learning_rate": 2.084398474063004e-06 } }, { "step": 9386496, "logs": { "loss": 0.1848, "epoch": 9.038817005545287, "learning_rate": 2.0450702009674755e-06 } }, { "step": 9405696, "logs": { "loss": 0.1802, "epoch": 9.057301293900185, "learning_rate": 2.0057419278719474e-06 } }, { "step": 9424896, "logs": { "loss": 0.1859, "epoch": 9.075785582255083, "learning_rate": 1.966413654776419e-06 } }, { "step": 9444096, "logs": { "loss": 0.1849, "epoch": 9.094269870609981, "learning_rate": 1.9270853816808904e-06 } }, { "step": 9463296, "logs": { "loss": 0.1841, "epoch": 9.11275415896488, "learning_rate": 1.8877571085853622e-06 } }, { "step": 9482496, "logs": { "loss": 0.1854, "epoch": 9.131238447319777, "learning_rate": 1.848428835489834e-06 } }, { "step": 9501696, "logs": { "loss": 0.1847, "epoch": 9.149722735674677, "learning_rate": 1.8091005623943054e-06 } }, { "step": 9520896, "logs": { "loss": 0.1852, "epoch": 9.168207024029575, "learning_rate": 1.769772289298777e-06 } }, { "step": 9540096, "logs": { "loss": 0.1846, "epoch": 9.186691312384474, "learning_rate": 1.7304440162032487e-06 } }, { "step": 9559296, "logs": { "loss": 0.1848, "epoch": 9.205175600739372, "learning_rate": 1.6911157431077202e-06 } }, { "step": 9578496, "logs": { "loss": 0.1861, "epoch": 9.22365988909427, "learning_rate": 1.6517874700121919e-06 } }, { "step": 9597696, "logs": { "loss": 0.185, "epoch": 9.242144177449168, "learning_rate": 1.6124591969166637e-06 } }, { "step": 9616896, "logs": { "loss": 0.1846, "epoch": 9.260628465804066, "learning_rate": 1.573130923821135e-06 } }, { "step": 9636096, "logs": { "loss": 0.1827, "epoch": 9.279112754158964, "learning_rate": 1.5338026507256069e-06 } }, { "step": 9655296, "logs": { "loss": 0.1871, "epoch": 9.297597042513864, "learning_rate": 1.4944743776300785e-06 } }, { "step": 9674496, "logs": { "loss": 0.1865, "epoch": 9.316081330868762, "learning_rate": 1.45514610453455e-06 } }, { "step": 9693696, "logs": { "loss": 0.1859, "epoch": 9.33456561922366, "learning_rate": 1.4158178314390217e-06 } }, { "step": 9712896, "logs": { "loss": 0.1874, "epoch": 9.353049907578558, "learning_rate": 1.3764895583434931e-06 } }, { "step": 9732096, "logs": { "loss": 0.1847, "epoch": 9.371534195933457, "learning_rate": 1.3371612852479648e-06 } }, { "step": 9751296, "logs": { "loss": 0.1849, "epoch": 9.390018484288355, "learning_rate": 1.2978330121524365e-06 } }, { "step": 9770496, "logs": { "loss": 0.1895, "epoch": 9.408502772643253, "learning_rate": 1.258504739056908e-06 } }, { "step": 9789696, "logs": { "loss": 0.1829, "epoch": 9.426987060998151, "learning_rate": 1.2191764659613798e-06 } }, { "step": 9808896, "logs": { "loss": 0.1837, "epoch": 9.445471349353049, "learning_rate": 1.1798481928658513e-06 } }, { "step": 9828096, "logs": { "loss": 0.1864, "epoch": 9.463955637707949, "learning_rate": 1.140519919770323e-06 } }, { "step": 9847296, "logs": { "loss": 0.1862, "epoch": 9.482439926062847, "learning_rate": 1.1011916466747946e-06 } }, { "step": 9866496, "logs": { "loss": 0.19, "epoch": 9.500924214417745, "learning_rate": 1.061863373579266e-06 } }, { "step": 9885696, "logs": { "loss": 0.1834, "epoch": 9.519408502772643, "learning_rate": 1.0225351004837378e-06 } }, { "step": 9904896, "logs": { "loss": 0.1863, "epoch": 9.537892791127542, "learning_rate": 9.832068273882094e-07 } }, { "step": 9924096, "logs": { "loss": 0.1859, "epoch": 9.55637707948244, "learning_rate": 9.438785542926811e-07 } }, { "step": 9943296, "logs": { "loss": 0.1829, "epoch": 9.574861367837338, "learning_rate": 9.045502811971527e-07 } }, { "step": 9962496, "logs": { "loss": 0.1838, "epoch": 9.593345656192236, "learning_rate": 8.652220081016244e-07 } }, { "step": 9981696, "logs": { "loss": 0.1817, "epoch": 9.611829944547136, "learning_rate": 8.258937350060959e-07 } }, { "step": 10000896, "logs": { "loss": 0.1834, "epoch": 9.630314232902034, "learning_rate": 7.865654619105675e-07 } }, { "step": 10020096, "logs": { "loss": 0.1857, "epoch": 9.648798521256932, "learning_rate": 7.472371888150393e-07 } }, { "step": 10039296, "logs": { "loss": 0.1858, "epoch": 9.66728280961183, "learning_rate": 7.079089157195108e-07 } }, { "step": 10058496, "logs": { "loss": 0.1858, "epoch": 9.685767097966728, "learning_rate": 6.685806426239824e-07 } }, { "step": 10077696, "logs": { "loss": 0.1848, "epoch": 9.704251386321626, "learning_rate": 6.29252369528454e-07 } }, { "step": 10096896, "logs": { "loss": 0.1832, "epoch": 9.722735674676525, "learning_rate": 5.899240964329256e-07 } }, { "step": 10116096, "logs": { "loss": 0.1842, "epoch": 9.741219963031423, "learning_rate": 5.505958233373973e-07 } }, { "step": 10135296, "logs": { "loss": 0.1842, "epoch": 9.75970425138632, "learning_rate": 5.112675502418689e-07 } }, { "step": 10154496, "logs": { "loss": 0.1847, "epoch": 9.77818853974122, "learning_rate": 4.7193927714634056e-07 } }, { "step": 10173696, "logs": { "loss": 0.185, "epoch": 9.796672828096119, "learning_rate": 4.326110040508122e-07 } }, { "step": 10192896, "logs": { "loss": 0.1826, "epoch": 9.815157116451017, "learning_rate": 3.9328273095528375e-07 } }, { "step": 10212096, "logs": { "loss": 0.1833, "epoch": 9.833641404805915, "learning_rate": 3.539544578597554e-07 } }, { "step": 10231296, "logs": { "loss": 0.1846, "epoch": 9.852125693160813, "learning_rate": 3.14626184764227e-07 } }, { "step": 10250496, "logs": { "loss": 0.184, "epoch": 9.870609981515711, "learning_rate": 2.7529791166869866e-07 } }, { "step": 10269696, "logs": { "loss": 0.1864, "epoch": 9.88909426987061, "learning_rate": 2.3596963857317028e-07 } }, { "step": 10288896, "logs": { "loss": 0.1841, "epoch": 9.907578558225508, "learning_rate": 1.9664136547764187e-07 } }, { "step": 10308096, "logs": { "loss": 0.1855, "epoch": 9.926062846580407, "learning_rate": 1.573130923821135e-07 } }, { "step": 10327296, "logs": { "loss": 0.1794, "epoch": 9.944547134935306, "learning_rate": 1.1798481928658514e-07 } }, { "step": 10346496, "logs": { "loss": 0.1853, "epoch": 9.963031423290204, "learning_rate": 7.865654619105675e-08 } }, { "step": 10365696, "logs": { "loss": 0.1855, "epoch": 9.981515711645102, "learning_rate": 3.9328273095528373e-08 } } ], "Evaluation": [ { "step": 2705, "logs": { "eval_loss": 0.9760558605194092 } }, { "step": 5410, "logs": { "eval_loss": 0.9268760681152344 } }, { "step": 8115, "logs": { "eval_loss": 0.9153628945350647 } }, { "step": 10820, "logs": { "eval_loss": 0.9207033514976501 } }, { "step": 13525, "logs": { "eval_loss": 0.9357024431228638 } }, { "step": 16230, "logs": { "eval_loss": 0.948551595211029 } }, { "step": 18935, "logs": { "eval_loss": 0.992328941822052 } }, { "step": 21640, "logs": { "eval_loss": 1.0297634601593018 } }, { "step": 24345, "logs": { "eval_loss": 1.0606719255447388 } }, { "step": 27050, "logs": { "eval_loss": 1.0935026407241821 } } ] } }