|
{ |
|
"best_metric": 2.1034367084503174, |
|
"best_model_checkpoint": "nyt_ingredients-crf-tagger-gte-small-L3-ingredient-v2/checkpoint-40000", |
|
"epoch": 10.0, |
|
"eval_steps": 1000, |
|
"global_step": 50510, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 4.9505048505246485e-05, |
|
"loss": 6.8194, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 4.9010097010492975e-05, |
|
"loss": 4.134, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_COMMENT": { |
|
"f1": 0.5763258721516435, |
|
"number": 6854, |
|
"precision": 0.5343387760189455, |
|
"recall": 0.6254741756638459 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.78330041694097, |
|
"number": 8845, |
|
"precision": 0.7608440797186401, |
|
"recall": 0.8071226681741097 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9729431253451132, |
|
"number": 7152, |
|
"precision": 0.960741548527808, |
|
"recall": 0.9854586129753915 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.0, |
|
"number": 105, |
|
"precision": 0.0, |
|
"recall": 0.0 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9476944253269098, |
|
"number": 5646, |
|
"precision": 0.921378387420542, |
|
"recall": 0.975557917109458 |
|
}, |
|
"eval_loss": 3.7770841121673584, |
|
"eval_overall_accuracy": 0.7948864068079933, |
|
"eval_overall_f1": 0.8085364620208354, |
|
"eval_overall_precision": 0.7806640625, |
|
"eval_overall_recall": 0.8384728340675477, |
|
"eval_runtime": 11.1289, |
|
"eval_samples_per_second": 764.316, |
|
"eval_steps_per_second": 23.902, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 4.851514551573946e-05, |
|
"loss": 3.7402, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 4.802019402098595e-05, |
|
"loss": 3.5226, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_COMMENT": { |
|
"f1": 0.6215112776922562, |
|
"number": 6854, |
|
"precision": 0.5741313218746136, |
|
"recall": 0.6774146483805077 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7914056489724146, |
|
"number": 8845, |
|
"precision": 0.7699133967710895, |
|
"recall": 0.8141322781232334 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9796598403332176, |
|
"number": 7152, |
|
"precision": 0.9728388253136633, |
|
"recall": 0.9865771812080537 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.6425339366515838, |
|
"number": 105, |
|
"precision": 0.6120689655172413, |
|
"recall": 0.6761904761904762 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9472432248746921, |
|
"number": 5646, |
|
"precision": 0.9102040816326531, |
|
"recall": 0.9874247254693589 |
|
}, |
|
"eval_loss": 3.3654797077178955, |
|
"eval_overall_accuracy": 0.8063976901451257, |
|
"eval_overall_f1": 0.8245767266863746, |
|
"eval_overall_precision": 0.7934958298312537, |
|
"eval_overall_recall": 0.8581917348437172, |
|
"eval_runtime": 11.014, |
|
"eval_samples_per_second": 772.292, |
|
"eval_steps_per_second": 24.151, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 4.752524252623243e-05, |
|
"loss": 3.3189, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"learning_rate": 4.703029103147892e-05, |
|
"loss": 3.1948, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_COMMENT": { |
|
"f1": 0.6503977349332615, |
|
"number": 6854, |
|
"precision": 0.6045112781954888, |
|
"recall": 0.7038225853516195 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8008250181169521, |
|
"number": 8845, |
|
"precision": 0.7898614471079833, |
|
"recall": 0.8120972300734879 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9830792896098447, |
|
"number": 7152, |
|
"precision": 0.9832167832167832, |
|
"recall": 0.9829418344519015 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7035573122529643, |
|
"number": 105, |
|
"precision": 0.6013513513513513, |
|
"recall": 0.8476190476190476 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9492858975455399, |
|
"number": 5646, |
|
"precision": 0.9178104845377874, |
|
"recall": 0.9829968119022316 |
|
}, |
|
"eval_loss": 3.1104416847229004, |
|
"eval_overall_accuracy": 0.8160474128105767, |
|
"eval_overall_f1": 0.8361769539655378, |
|
"eval_overall_precision": 0.8112035241132187, |
|
"eval_overall_recall": 0.8627368715474443, |
|
"eval_runtime": 9.4851, |
|
"eval_samples_per_second": 896.774, |
|
"eval_steps_per_second": 28.044, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"learning_rate": 4.65353395367254e-05, |
|
"loss": 3.1131, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 4.6040388041971886e-05, |
|
"loss": 3.0233, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"eval_COMMENT": { |
|
"f1": 0.6598611678236015, |
|
"number": 6854, |
|
"precision": 0.6183673469387755, |
|
"recall": 0.7073241902538664 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8091748251748251, |
|
"number": 8845, |
|
"precision": 0.8008859357696567, |
|
"recall": 0.8176370830977954 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9835126449629734, |
|
"number": 7152, |
|
"precision": 0.982826026249651, |
|
"recall": 0.9842002237136466 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.5851063829787234, |
|
"number": 105, |
|
"precision": 0.6626506024096386, |
|
"recall": 0.5238095238095238 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9505612201182417, |
|
"number": 5646, |
|
"precision": 0.9206639004149377, |
|
"recall": 0.9824654622741764 |
|
}, |
|
"eval_loss": 3.005340576171875, |
|
"eval_overall_accuracy": 0.8174150900387509, |
|
"eval_overall_f1": 0.8416805692690068, |
|
"eval_overall_precision": 0.8202057067020571, |
|
"eval_overall_recall": 0.8643101880987344, |
|
"eval_runtime": 11.0513, |
|
"eval_samples_per_second": 769.68, |
|
"eval_steps_per_second": 24.069, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"learning_rate": 4.5545436547218376e-05, |
|
"loss": 2.9721, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 4.505048505246486e-05, |
|
"loss": 2.9567, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_COMMENT": { |
|
"f1": 0.677434679334917, |
|
"number": 6854, |
|
"precision": 0.633295267098084, |
|
"recall": 0.7281879194630873 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8113767426235933, |
|
"number": 8845, |
|
"precision": 0.8036823425022183, |
|
"recall": 0.8192198982475976 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9826323498639883, |
|
"number": 7152, |
|
"precision": 0.9803757828810021, |
|
"recall": 0.9848993288590604 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.6288659793814434, |
|
"number": 105, |
|
"precision": 0.6853932584269663, |
|
"recall": 0.580952380952381 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9479768786127167, |
|
"number": 5646, |
|
"precision": 0.9114089571755476, |
|
"recall": 0.9876018420120439 |
|
}, |
|
"eval_loss": 2.910010814666748, |
|
"eval_overall_accuracy": 0.8215941037915052, |
|
"eval_overall_f1": 0.8462413611587509, |
|
"eval_overall_precision": 0.8226748984779954, |
|
"eval_overall_recall": 0.8711978183343823, |
|
"eval_runtime": 11.1963, |
|
"eval_samples_per_second": 759.713, |
|
"eval_steps_per_second": 23.758, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 4.455553355771135e-05, |
|
"loss": 2.794, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"learning_rate": 4.406058206295783e-05, |
|
"loss": 2.738, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_COMMENT": { |
|
"f1": 0.6844883595018949, |
|
"number": 6854, |
|
"precision": 0.6383489017924766, |
|
"recall": 0.7378173329442661 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.809906216656371, |
|
"number": 8845, |
|
"precision": 0.8046195045748716, |
|
"recall": 0.8152628603730921 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9817170663885992, |
|
"number": 7152, |
|
"precision": 0.9762201023088621, |
|
"recall": 0.9872762863534675 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7286821705426357, |
|
"number": 105, |
|
"precision": 0.6143790849673203, |
|
"recall": 0.8952380952380953 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9514546393527284, |
|
"number": 5646, |
|
"precision": 0.9254855994641661, |
|
"recall": 0.9789231314204747 |
|
}, |
|
"eval_loss": 2.8514182567596436, |
|
"eval_overall_accuracy": 0.8213471620697516, |
|
"eval_overall_f1": 0.8480048942967846, |
|
"eval_overall_precision": 0.8250115733086436, |
|
"eval_overall_recall": 0.8723166212152996, |
|
"eval_runtime": 8.7005, |
|
"eval_samples_per_second": 977.64, |
|
"eval_steps_per_second": 30.573, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 1.29, |
|
"learning_rate": 4.356563056820432e-05, |
|
"loss": 2.7896, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"learning_rate": 4.3070679073450804e-05, |
|
"loss": 2.8132, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_COMMENT": { |
|
"f1": 0.680542242913871, |
|
"number": 6854, |
|
"precision": 0.641124871001032, |
|
"recall": 0.7251240151736212 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8072829131652661, |
|
"number": 8845, |
|
"precision": 0.8001110494169905, |
|
"recall": 0.814584511023177 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9839452743263996, |
|
"number": 7152, |
|
"precision": 0.9824365765263451, |
|
"recall": 0.9854586129753915 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7421875, |
|
"number": 105, |
|
"precision": 0.6291390728476821, |
|
"recall": 0.9047619047619048 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9518423307626392, |
|
"number": 5646, |
|
"precision": 0.9219787516600265, |
|
"recall": 0.983705278072972 |
|
}, |
|
"eval_loss": 2.776045322418213, |
|
"eval_overall_accuracy": 0.8222589468885343, |
|
"eval_overall_f1": 0.8473121210056551, |
|
"eval_overall_precision": 0.8261476117717399, |
|
"eval_overall_recall": 0.8695895391930635, |
|
"eval_runtime": 11.1273, |
|
"eval_samples_per_second": 764.429, |
|
"eval_steps_per_second": 23.905, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"learning_rate": 4.257572757869729e-05, |
|
"loss": 2.7089, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 4.208077608394378e-05, |
|
"loss": 2.6976, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_COMMENT": { |
|
"f1": 0.6947368421052631, |
|
"number": 6854, |
|
"precision": 0.6535493827160493, |
|
"recall": 0.7414648380507732 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8145306859205775, |
|
"number": 8845, |
|
"precision": 0.8127884723629405, |
|
"recall": 0.8162803843979649 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9840759882665177, |
|
"number": 7152, |
|
"precision": 0.9831147083449623, |
|
"recall": 0.9850391498881432 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.75098814229249, |
|
"number": 105, |
|
"precision": 0.6418918918918919, |
|
"recall": 0.9047619047619048 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9538461538461539, |
|
"number": 5646, |
|
"precision": 0.926531975288028, |
|
"recall": 0.9828196953595466 |
|
}, |
|
"eval_loss": 2.707292318344116, |
|
"eval_overall_accuracy": 0.826172023402477, |
|
"eval_overall_f1": 0.8534594631514241, |
|
"eval_overall_precision": 0.8340898471397103, |
|
"eval_overall_recall": 0.8737500874064751, |
|
"eval_runtime": 10.8076, |
|
"eval_samples_per_second": 787.041, |
|
"eval_steps_per_second": 24.612, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"learning_rate": 4.158582458919026e-05, |
|
"loss": 2.6869, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"learning_rate": 4.109087309443675e-05, |
|
"loss": 2.6347, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_COMMENT": { |
|
"f1": 0.6949685534591195, |
|
"number": 6854, |
|
"precision": 0.6538461538461539, |
|
"recall": 0.7416107382550335 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8143807055111011, |
|
"number": 8845, |
|
"precision": 0.8118188967531738, |
|
"recall": 0.8169587337478802 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9832394464149107, |
|
"number": 7152, |
|
"precision": 0.9781375397813754, |
|
"recall": 0.9883948545861297 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7588932806324111, |
|
"number": 105, |
|
"precision": 0.6486486486486487, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9523400601116359, |
|
"number": 5646, |
|
"precision": 0.92432072012002, |
|
"recall": 0.9821112291888062 |
|
}, |
|
"eval_loss": 2.6447880268096924, |
|
"eval_overall_accuracy": 0.8236836106678824, |
|
"eval_overall_f1": 0.8531482839167277, |
|
"eval_overall_precision": 0.832606742320876, |
|
"eval_overall_recall": 0.8747290399272778, |
|
"eval_runtime": 10.4718, |
|
"eval_samples_per_second": 812.274, |
|
"eval_steps_per_second": 25.401, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 4.059592159968323e-05, |
|
"loss": 2.5569, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 4.010097010492972e-05, |
|
"loss": 2.5847, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_COMMENT": { |
|
"f1": 0.6963045290358433, |
|
"number": 6854, |
|
"precision": 0.6645452134712277, |
|
"recall": 0.7312518237525533 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8156796390298928, |
|
"number": 8845, |
|
"precision": 0.8138435565559933, |
|
"recall": 0.8175240248728095 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9831476323119777, |
|
"number": 7152, |
|
"precision": 0.9793285238623751, |
|
"recall": 0.986996644295302 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7639484978540773, |
|
"number": 105, |
|
"precision": 0.6953125, |
|
"recall": 0.8476190476190476 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9530017152658663, |
|
"number": 5646, |
|
"precision": 0.9238443631526438, |
|
"recall": 0.9840595111583422 |
|
}, |
|
"eval_loss": 2.591038227081299, |
|
"eval_overall_accuracy": 0.8253172251348682, |
|
"eval_overall_f1": 0.8546566402302197, |
|
"eval_overall_precision": 0.8377942707458776, |
|
"eval_overall_recall": 0.8722117334452136, |
|
"eval_runtime": 10.9908, |
|
"eval_samples_per_second": 773.919, |
|
"eval_steps_per_second": 24.202, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 2.08, |
|
"learning_rate": 3.9606018610176205e-05, |
|
"loss": 2.5001, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 2.18, |
|
"learning_rate": 3.911106711542269e-05, |
|
"loss": 2.4321, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 2.18, |
|
"eval_COMMENT": { |
|
"f1": 0.7009998630324613, |
|
"number": 6854, |
|
"precision": 0.660557563242127, |
|
"recall": 0.7467172454041435 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8124085125548924, |
|
"number": 8845, |
|
"precision": 0.8091286307053942, |
|
"recall": 0.8157150932730356 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9833752444816989, |
|
"number": 7152, |
|
"precision": 0.9825516471245115, |
|
"recall": 0.9842002237136466 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7404580152671757, |
|
"number": 105, |
|
"precision": 0.6178343949044586, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9521690767519465, |
|
"number": 5646, |
|
"precision": 0.9210395629862606, |
|
"recall": 0.9854764434998229 |
|
}, |
|
"eval_loss": 2.5731780529022217, |
|
"eval_overall_accuracy": 0.8255071803054479, |
|
"eval_overall_f1": 0.8539459994200822, |
|
"eval_overall_precision": 0.8336830186165785, |
|
"eval_overall_recall": 0.8752185161876792, |
|
"eval_runtime": 9.4187, |
|
"eval_samples_per_second": 903.101, |
|
"eval_steps_per_second": 28.242, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"learning_rate": 3.861611562066917e-05, |
|
"loss": 2.5117, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 2.38, |
|
"learning_rate": 3.812116412591566e-05, |
|
"loss": 2.4326, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 2.38, |
|
"eval_COMMENT": { |
|
"f1": 0.7086570477247504, |
|
"number": 6854, |
|
"precision": 0.6754826765405977, |
|
"recall": 0.7452582433615407 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8158534516876803, |
|
"number": 8845, |
|
"precision": 0.8159918570459173, |
|
"recall": 0.8157150932730356 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9844993715961456, |
|
"number": 7152, |
|
"precision": 0.9832635983263598, |
|
"recall": 0.985738255033557 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7654320987654321, |
|
"number": 105, |
|
"precision": 0.6739130434782609, |
|
"recall": 0.8857142857142857 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9534265374388883, |
|
"number": 5646, |
|
"precision": 0.9243306169965075, |
|
"recall": 0.9844137442437123 |
|
}, |
|
"eval_loss": 2.5278468132019043, |
|
"eval_overall_accuracy": 0.8280525795912165, |
|
"eval_overall_f1": 0.8580588749635675, |
|
"eval_overall_precision": 0.8418502943650126, |
|
"eval_overall_recall": 0.8749038528774211, |
|
"eval_runtime": 11.4233, |
|
"eval_samples_per_second": 744.616, |
|
"eval_steps_per_second": 23.286, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 2.47, |
|
"learning_rate": 3.762621263116215e-05, |
|
"loss": 2.3983, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 2.57, |
|
"learning_rate": 3.7131261136408633e-05, |
|
"loss": 2.3705, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 2.57, |
|
"eval_COMMENT": { |
|
"f1": 0.7056559686619477, |
|
"number": 6854, |
|
"precision": 0.6670131219955827, |
|
"recall": 0.7490516486723081 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8140058545372664, |
|
"number": 8845, |
|
"precision": 0.8106289942818702, |
|
"recall": 0.8174109666478236 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9845080251221213, |
|
"number": 7152, |
|
"precision": 0.9827249930342714, |
|
"recall": 0.9862975391498882 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7415730337078652, |
|
"number": 105, |
|
"precision": 0.6111111111111112, |
|
"recall": 0.9428571428571428 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.952819725279413, |
|
"number": 5646, |
|
"precision": 0.9191769547325103, |
|
"recall": 0.9890187743535246 |
|
}, |
|
"eval_loss": 2.4818899631500244, |
|
"eval_overall_accuracy": 0.8270458171871439, |
|
"eval_overall_f1": 0.8562072552999164, |
|
"eval_overall_precision": 0.8358363024874297, |
|
"eval_overall_recall": 0.8775959723096287, |
|
"eval_runtime": 9.7776, |
|
"eval_samples_per_second": 869.945, |
|
"eval_steps_per_second": 27.205, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 2.67, |
|
"learning_rate": 3.663630964165512e-05, |
|
"loss": 2.4183, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 3.6141358146901606e-05, |
|
"loss": 2.364, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_COMMENT": { |
|
"f1": 0.7068350260774088, |
|
"number": 6854, |
|
"precision": 0.6672713138118683, |
|
"recall": 0.7513860519404727 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8130456824198727, |
|
"number": 8845, |
|
"precision": 0.8101706331387517, |
|
"recall": 0.8159412097230073 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9847269684078387, |
|
"number": 7152, |
|
"precision": 0.9823292055099485, |
|
"recall": 0.9871364653243848 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7729083665338645, |
|
"number": 105, |
|
"precision": 0.6643835616438356, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9542999228328902, |
|
"number": 5646, |
|
"precision": 0.9248795080604952, |
|
"recall": 0.9856535600425079 |
|
}, |
|
"eval_loss": 2.4206130504608154, |
|
"eval_overall_accuracy": 0.8284704809664919, |
|
"eval_overall_f1": 0.8566014544709617, |
|
"eval_overall_precision": 0.8369695756605284, |
|
"eval_overall_recall": 0.8771764212292846, |
|
"eval_runtime": 10.6958, |
|
"eval_samples_per_second": 795.265, |
|
"eval_steps_per_second": 24.87, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 2.87, |
|
"learning_rate": 3.564640665214809e-05, |
|
"loss": 2.3089, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"learning_rate": 3.515145515739457e-05, |
|
"loss": 2.3349, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"eval_COMMENT": { |
|
"f1": 0.7115305703734099, |
|
"number": 6854, |
|
"precision": 0.6696704428424305, |
|
"recall": 0.7589728625620076 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8152284263959392, |
|
"number": 8845, |
|
"precision": 0.8133933595948227, |
|
"recall": 0.8170717919728661 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9854223338215806, |
|
"number": 7152, |
|
"precision": 0.9831593597773138, |
|
"recall": 0.9876957494407159 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7320754716981133, |
|
"number": 105, |
|
"precision": 0.60625, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.954592186429061, |
|
"number": 5646, |
|
"precision": 0.9244938599402589, |
|
"recall": 0.9867162592986185 |
|
}, |
|
"eval_loss": 2.390350103378296, |
|
"eval_overall_accuracy": 0.8285084720006078, |
|
"eval_overall_f1": 0.8583563606590933, |
|
"eval_overall_precision": 0.8380295763389288, |
|
"eval_overall_recall": 0.8796937277113489, |
|
"eval_runtime": 13.4662, |
|
"eval_samples_per_second": 631.657, |
|
"eval_steps_per_second": 19.753, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 3.07, |
|
"learning_rate": 3.465650366264107e-05, |
|
"loss": 2.251, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 3.17, |
|
"learning_rate": 3.416155216788755e-05, |
|
"loss": 2.253, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 3.17, |
|
"eval_COMMENT": { |
|
"f1": 0.7120891136472357, |
|
"number": 6854, |
|
"precision": 0.669751896130608, |
|
"recall": 0.7601400641960899 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8165914221218961, |
|
"number": 8845, |
|
"precision": 0.8152112676056338, |
|
"recall": 0.817976257772753 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9850704618389843, |
|
"number": 7152, |
|
"precision": 0.9830130882762461, |
|
"recall": 0.9871364653243848 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7529411764705883, |
|
"number": 105, |
|
"precision": 0.64, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9538013199622868, |
|
"number": 5646, |
|
"precision": 0.924098986879256, |
|
"recall": 0.9854764434998229 |
|
}, |
|
"eval_loss": 2.3770651817321777, |
|
"eval_overall_accuracy": 0.8302180685358256, |
|
"eval_overall_f1": 0.8587418314593322, |
|
"eval_overall_precision": 0.8386376512147166, |
|
"eval_overall_recall": 0.8798335780714636, |
|
"eval_runtime": 11.0556, |
|
"eval_samples_per_second": 769.382, |
|
"eval_steps_per_second": 24.06, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 3.27, |
|
"learning_rate": 3.3666600673134034e-05, |
|
"loss": 2.1955, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 3.37, |
|
"learning_rate": 3.317164917838052e-05, |
|
"loss": 2.2137, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 3.37, |
|
"eval_COMMENT": { |
|
"f1": 0.7152373022481265, |
|
"number": 6854, |
|
"precision": 0.6819264355649642, |
|
"recall": 0.7519696527575138 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.816918906708832, |
|
"number": 8845, |
|
"precision": 0.8160893602617624, |
|
"recall": 0.8177501413227812 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852099902330124, |
|
"number": 7152, |
|
"precision": 0.9831523252575884, |
|
"recall": 0.9872762863534675 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7619047619047618, |
|
"number": 105, |
|
"precision": 0.6530612244897959, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9529855868222373, |
|
"number": 5646, |
|
"precision": 0.924126455906822, |
|
"recall": 0.983705278072972 |
|
}, |
|
"eval_loss": 2.378207206726074, |
|
"eval_overall_accuracy": 0.8285464630347238, |
|
"eval_overall_f1": 0.8600801891641822, |
|
"eval_overall_precision": 0.8433467741935484, |
|
"eval_overall_recall": 0.8774910845395427, |
|
"eval_runtime": 10.7102, |
|
"eval_samples_per_second": 794.197, |
|
"eval_steps_per_second": 24.836, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"learning_rate": 3.267669768362701e-05, |
|
"loss": 2.2027, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 3.56, |
|
"learning_rate": 3.218174618887349e-05, |
|
"loss": 2.2065, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 3.56, |
|
"eval_COMMENT": { |
|
"f1": 0.715327462850853, |
|
"number": 6854, |
|
"precision": 0.6767768810205675, |
|
"recall": 0.7585351619492268 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8111738148984199, |
|
"number": 8845, |
|
"precision": 0.8098028169014084, |
|
"recall": 0.8125494629734313 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852766729467587, |
|
"number": 7152, |
|
"precision": 0.9834238751915308, |
|
"recall": 0.9871364653243848 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.751937984496124, |
|
"number": 105, |
|
"precision": 0.6339869281045751, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9542920847268673, |
|
"number": 5646, |
|
"precision": 0.9250207813798836, |
|
"recall": 0.9854764434998229 |
|
}, |
|
"eval_loss": 2.3392648696899414, |
|
"eval_overall_accuracy": 0.829154319580579, |
|
"eval_overall_f1": 0.8582709465695826, |
|
"eval_overall_precision": 0.8395866773675762, |
|
"eval_overall_recall": 0.8778057478498007, |
|
"eval_runtime": 10.643, |
|
"eval_samples_per_second": 799.209, |
|
"eval_steps_per_second": 24.993, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 3.66, |
|
"learning_rate": 3.168679469411997e-05, |
|
"loss": 2.17, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"learning_rate": 3.119184319936647e-05, |
|
"loss": 2.1758, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"eval_COMMENT": { |
|
"f1": 0.7196268093572066, |
|
"number": 6854, |
|
"precision": 0.6791402304803833, |
|
"recall": 0.7652465713451999 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8154011420817548, |
|
"number": 8845, |
|
"precision": 0.8155394707079846, |
|
"recall": 0.8152628603730921 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9850017439832579, |
|
"number": 7152, |
|
"precision": 0.9828762355561743, |
|
"recall": 0.9871364653243848 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7637795275590552, |
|
"number": 105, |
|
"precision": 0.6510067114093959, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544714052988081, |
|
"number": 5646, |
|
"precision": 0.9250457038391224, |
|
"recall": 0.9858306765851931 |
|
}, |
|
"eval_loss": 2.306312322616577, |
|
"eval_overall_accuracy": 0.827710660284173, |
|
"eval_overall_f1": 0.8605851391072529, |
|
"eval_overall_precision": 0.8417129103429832, |
|
"eval_overall_recall": 0.8803230543318649, |
|
"eval_runtime": 11.977, |
|
"eval_samples_per_second": 710.192, |
|
"eval_steps_per_second": 22.209, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 3.86, |
|
"learning_rate": 3.069689170461295e-05, |
|
"loss": 2.2238, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 3.96, |
|
"learning_rate": 3.0201940209859435e-05, |
|
"loss": 2.1417, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 3.96, |
|
"eval_COMMENT": { |
|
"f1": 0.7152720243026789, |
|
"number": 6854, |
|
"precision": 0.6788990825688074, |
|
"recall": 0.7557630580682813 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.815481242573417, |
|
"number": 8845, |
|
"precision": 0.8162664250113276, |
|
"recall": 0.8146975692481628 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9854263998326477, |
|
"number": 7152, |
|
"precision": 0.9828905271943247, |
|
"recall": 0.9879753914988815 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7634854771784232, |
|
"number": 105, |
|
"precision": 0.6764705882352942, |
|
"recall": 0.8761904761904762 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9533384893013664, |
|
"number": 5646, |
|
"precision": 0.9258888332498748, |
|
"recall": 0.9824654622741764 |
|
}, |
|
"eval_loss": 2.288215398788452, |
|
"eval_overall_accuracy": 0.8285084720006078, |
|
"eval_overall_f1": 0.8596340962039195, |
|
"eval_overall_precision": 0.8427151205749983, |
|
"eval_overall_recall": 0.877246346409342, |
|
"eval_runtime": 9.5122, |
|
"eval_samples_per_second": 894.221, |
|
"eval_steps_per_second": 27.964, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 4.06, |
|
"learning_rate": 2.970698871510592e-05, |
|
"loss": 2.1114, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 4.16, |
|
"learning_rate": 2.9212037220352405e-05, |
|
"loss": 2.0271, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 4.16, |
|
"eval_COMMENT": { |
|
"f1": 0.7168075752451809, |
|
"number": 6854, |
|
"precision": 0.6681376875551632, |
|
"recall": 0.7731251823752553 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8170380818053596, |
|
"number": 8845, |
|
"precision": 0.815427927927928, |
|
"recall": 0.8186546071226681 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858546442756603, |
|
"number": 7152, |
|
"precision": 0.9826364772885123, |
|
"recall": 0.9890939597315436 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7717842323651452, |
|
"number": 105, |
|
"precision": 0.6838235294117647, |
|
"recall": 0.8857142857142857 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9534565366187543, |
|
"number": 5646, |
|
"precision": 0.922211188348229, |
|
"recall": 0.9868933758413035 |
|
}, |
|
"eval_loss": 2.350003242492676, |
|
"eval_overall_accuracy": 0.82989514474584, |
|
"eval_overall_f1": 0.859976186426263, |
|
"eval_overall_precision": 0.837385716178614, |
|
"eval_overall_recall": 0.8838193133347318, |
|
"eval_runtime": 11.0178, |
|
"eval_samples_per_second": 772.02, |
|
"eval_steps_per_second": 24.143, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 4.26, |
|
"learning_rate": 2.871708572559889e-05, |
|
"loss": 2.0589, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"learning_rate": 2.8222134230845377e-05, |
|
"loss": 2.0488, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"eval_COMMENT": { |
|
"f1": 0.7173793103448276, |
|
"number": 6854, |
|
"precision": 0.6802249542244311, |
|
"recall": 0.7588269623577473 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.814222122048797, |
|
"number": 8845, |
|
"precision": 0.8116153673331835, |
|
"recall": 0.8168456755228943 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9854284319877291, |
|
"number": 7152, |
|
"precision": 0.9827562230565985, |
|
"recall": 0.9881152125279642 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7686274509803921, |
|
"number": 105, |
|
"precision": 0.6533333333333333, |
|
"recall": 0.9333333333333333 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9529190207156308, |
|
"number": 5646, |
|
"precision": 0.9221338634857521, |
|
"recall": 0.9858306765851931 |
|
}, |
|
"eval_loss": 2.2779643535614014, |
|
"eval_overall_accuracy": 0.8274067320112454, |
|
"eval_overall_f1": 0.8596716045585798, |
|
"eval_overall_precision": 0.8406683375104428, |
|
"eval_overall_recall": 0.8795538773512341, |
|
"eval_runtime": 10.9882, |
|
"eval_samples_per_second": 774.104, |
|
"eval_steps_per_second": 24.208, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 4.45, |
|
"learning_rate": 2.7727182736091867e-05, |
|
"loss": 2.0377, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"learning_rate": 2.7232231241338353e-05, |
|
"loss": 2.0403, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"eval_COMMENT": { |
|
"f1": 0.7213069552629764, |
|
"number": 6854, |
|
"precision": 0.6836534692277538, |
|
"recall": 0.7633498686898161 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8175446529504862, |
|
"number": 8845, |
|
"precision": 0.8174522436984288, |
|
"recall": 0.8176370830977954 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858447806986962, |
|
"number": 7152, |
|
"precision": 0.9833078314090973, |
|
"recall": 0.9883948545861297 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7868852459016393, |
|
"number": 105, |
|
"precision": 0.6906474820143885, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9541991267870901, |
|
"number": 5646, |
|
"precision": 0.9234465617232809, |
|
"recall": 0.9870704923839887 |
|
}, |
|
"eval_loss": 2.255697250366211, |
|
"eval_overall_accuracy": 0.8292303016488108, |
|
"eval_overall_f1": 0.8621226374754127, |
|
"eval_overall_precision": 0.8439205706057663, |
|
"eval_overall_recall": 0.8811271939025243, |
|
"eval_runtime": 11.1445, |
|
"eval_samples_per_second": 763.249, |
|
"eval_steps_per_second": 23.868, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 4.65, |
|
"learning_rate": 2.6737279746584836e-05, |
|
"loss": 2.0887, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"learning_rate": 2.6242328251831323e-05, |
|
"loss": 2.0443, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"eval_COMMENT": { |
|
"f1": 0.7226055754899255, |
|
"number": 6854, |
|
"precision": 0.6855197695731867, |
|
"recall": 0.7639334695068573 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8165780843605112, |
|
"number": 8845, |
|
"precision": 0.8167628096369189, |
|
"recall": 0.8163934426229508 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852161785216179, |
|
"number": 7152, |
|
"precision": 0.9827490261547023, |
|
"recall": 0.9876957494407159 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7854251012145749, |
|
"number": 105, |
|
"precision": 0.6830985915492958, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9537354352296092, |
|
"number": 5646, |
|
"precision": 0.9236641221374046, |
|
"recall": 0.9858306765851931 |
|
}, |
|
"eval_loss": 2.228408098220825, |
|
"eval_overall_accuracy": 0.829097333029405, |
|
"eval_overall_f1": 0.8619196741790305, |
|
"eval_overall_precision": 0.8441092676386794, |
|
"eval_overall_recall": 0.8804978672820083, |
|
"eval_runtime": 10.5005, |
|
"eval_samples_per_second": 810.058, |
|
"eval_steps_per_second": 25.332, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 4.85, |
|
"learning_rate": 2.5747376757077806e-05, |
|
"loss": 2.068, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 4.95, |
|
"learning_rate": 2.5252425262324292e-05, |
|
"loss": 2.0214, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 4.95, |
|
"eval_COMMENT": { |
|
"f1": 0.7221103783408538, |
|
"number": 6854, |
|
"precision": 0.6887829426566018, |
|
"recall": 0.7588269623577473 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8139863300005649, |
|
"number": 8845, |
|
"precision": 0.8133890268683676, |
|
"recall": 0.814584511023177 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864751812604574, |
|
"number": 7152, |
|
"precision": 0.9837319243604005, |
|
"recall": 0.9892337807606264 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7713004484304932, |
|
"number": 105, |
|
"precision": 0.7288135593220338, |
|
"recall": 0.819047619047619 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9553288176283975, |
|
"number": 5646, |
|
"precision": 0.9258766827322586, |
|
"recall": 0.9867162592986185 |
|
}, |
|
"eval_loss": 2.2036967277526855, |
|
"eval_overall_accuracy": 0.8304270192234633, |
|
"eval_overall_f1": 0.8618053412869828, |
|
"eval_overall_precision": 0.8453726123217649, |
|
"eval_overall_recall": 0.8788895881406895, |
|
"eval_runtime": 10.7118, |
|
"eval_samples_per_second": 794.075, |
|
"eval_steps_per_second": 24.832, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"learning_rate": 2.4757473767570778e-05, |
|
"loss": 2.0164, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 5.15, |
|
"learning_rate": 2.4262522272817265e-05, |
|
"loss": 2.0081, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 5.15, |
|
"eval_COMMENT": { |
|
"f1": 0.719671201814059, |
|
"number": 6854, |
|
"precision": 0.6996417745935519, |
|
"recall": 0.7408812372337321 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8098846414838272, |
|
"number": 8845, |
|
"precision": 0.8101595203077271, |
|
"recall": 0.8096099491237988 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862001672706997, |
|
"number": 7152, |
|
"precision": 0.9831851028349082, |
|
"recall": 0.9892337807606264 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7918367346938776, |
|
"number": 105, |
|
"precision": 0.6928571428571428, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9546235819869371, |
|
"number": 5646, |
|
"precision": 0.927212020033389, |
|
"recall": 0.983705278072972 |
|
}, |
|
"eval_loss": 2.2013936042785645, |
|
"eval_overall_accuracy": 0.8273117544259555, |
|
"eval_overall_f1": 0.8604911676001723, |
|
"eval_overall_precision": 0.8484858783944533, |
|
"eval_overall_recall": 0.8728410600657297, |
|
"eval_runtime": 11.2303, |
|
"eval_samples_per_second": 757.413, |
|
"eval_steps_per_second": 23.686, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"learning_rate": 2.376757077806375e-05, |
|
"loss": 1.9905, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"learning_rate": 2.3272619283310237e-05, |
|
"loss": 1.9138, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"eval_COMMENT": { |
|
"f1": 0.7232730263157895, |
|
"number": 6854, |
|
"precision": 0.6819591625743086, |
|
"recall": 0.7699153778815291 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8175660419959357, |
|
"number": 8845, |
|
"precision": 0.8163679404802164, |
|
"recall": 0.818767665347654 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861333704968295, |
|
"number": 7152, |
|
"precision": 0.9829142936518961, |
|
"recall": 0.9893736017897091 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7679324894514767, |
|
"number": 105, |
|
"precision": 0.6893939393939394, |
|
"recall": 0.8666666666666667 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9538567493112948, |
|
"number": 5646, |
|
"precision": 0.9279731993299832, |
|
"recall": 0.9812256464753808 |
|
}, |
|
"eval_loss": 2.1838574409484863, |
|
"eval_overall_accuracy": 0.8322695843780867, |
|
"eval_overall_f1": 0.8622504785343178, |
|
"eval_overall_precision": 0.8433968572383818, |
|
"eval_overall_recall": 0.8819662960632124, |
|
"eval_runtime": 10.2972, |
|
"eval_samples_per_second": 826.053, |
|
"eval_steps_per_second": 25.832, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 5.44, |
|
"learning_rate": 2.2777667788556724e-05, |
|
"loss": 1.9236, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 5.54, |
|
"learning_rate": 2.2282716293803206e-05, |
|
"loss": 1.9304, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 5.54, |
|
"eval_COMMENT": { |
|
"f1": 0.7215675336447948, |
|
"number": 6854, |
|
"precision": 0.6910645118204889, |
|
"recall": 0.7548876568427196 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8127016471387332, |
|
"number": 8845, |
|
"precision": 0.8137610519156654, |
|
"recall": 0.8116449971735443 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9857760423929716, |
|
"number": 7152, |
|
"precision": 0.9831710709318497, |
|
"recall": 0.9883948545861297 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.776, |
|
"number": 105, |
|
"precision": 0.6689655172413793, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9539864109400533, |
|
"number": 5646, |
|
"precision": 0.9272696873432537, |
|
"recall": 0.9822883457314914 |
|
}, |
|
"eval_loss": 2.1557235717773438, |
|
"eval_overall_accuracy": 0.8287364182053035, |
|
"eval_overall_f1": 0.860940800659488, |
|
"eval_overall_precision": 0.8460759493670886, |
|
"eval_overall_recall": 0.8763373190685966, |
|
"eval_runtime": 11.4111, |
|
"eval_samples_per_second": 745.412, |
|
"eval_steps_per_second": 23.311, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 5.64, |
|
"learning_rate": 2.1787764799049696e-05, |
|
"loss": 1.908, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 5.74, |
|
"learning_rate": 2.129281330429618e-05, |
|
"loss": 1.9369, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 5.74, |
|
"eval_COMMENT": { |
|
"f1": 0.7214330697641872, |
|
"number": 6854, |
|
"precision": 0.6931558424095737, |
|
"recall": 0.7521155529617741 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8120292235374073, |
|
"number": 8845, |
|
"precision": 0.8135497049477984, |
|
"recall": 0.8105144149236857 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862020905923344, |
|
"number": 7152, |
|
"precision": 0.9830508474576272, |
|
"recall": 0.9893736017897091 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7841409691629957, |
|
"number": 105, |
|
"precision": 0.7295081967213115, |
|
"recall": 0.8476190476190476 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9530419880034275, |
|
"number": 5646, |
|
"precision": 0.923140770252324, |
|
"recall": 0.9849450938717677 |
|
}, |
|
"eval_loss": 2.152221918106079, |
|
"eval_overall_accuracy": 0.8286794316541296, |
|
"eval_overall_f1": 0.8608987026376836, |
|
"eval_overall_precision": 0.8464839658027237, |
|
"eval_overall_recall": 0.8758128802181666, |
|
"eval_runtime": 8.8394, |
|
"eval_samples_per_second": 962.281, |
|
"eval_steps_per_second": 30.093, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 5.84, |
|
"learning_rate": 2.0797861809542665e-05, |
|
"loss": 1.9176, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"learning_rate": 2.0302910314789152e-05, |
|
"loss": 1.8944, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"eval_COMMENT": { |
|
"f1": 0.723598615916955, |
|
"number": 6854, |
|
"precision": 0.6882569773565034, |
|
"recall": 0.762766267872775 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8156853881794554, |
|
"number": 8845, |
|
"precision": 0.8153168417485598, |
|
"recall": 0.8160542679479932 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9857272157627236, |
|
"number": 7152, |
|
"precision": 0.9816946331992789, |
|
"recall": 0.9897930648769575 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7631578947368421, |
|
"number": 105, |
|
"precision": 0.7073170731707317, |
|
"recall": 0.8285714285714286 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9549935705100728, |
|
"number": 5646, |
|
"precision": 0.9254028908456554, |
|
"recall": 0.9865391427559334 |
|
}, |
|
"eval_loss": 2.128391742706299, |
|
"eval_overall_accuracy": 0.8317377099004635, |
|
"eval_overall_f1": 0.8623381960139715, |
|
"eval_overall_precision": 0.8449768471914637, |
|
"eval_overall_recall": 0.880427942101951, |
|
"eval_runtime": 11.5016, |
|
"eval_samples_per_second": 739.547, |
|
"eval_steps_per_second": 23.127, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 6.04, |
|
"learning_rate": 1.9807958820035638e-05, |
|
"loss": 1.837, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 6.14, |
|
"learning_rate": 1.9313007325282124e-05, |
|
"loss": 1.8311, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 6.14, |
|
"eval_COMMENT": { |
|
"f1": 0.7244426318651441, |
|
"number": 6854, |
|
"precision": 0.6781623822855688, |
|
"recall": 0.7775021885030639 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.818961625282167, |
|
"number": 8845, |
|
"precision": 0.8175774647887324, |
|
"recall": 0.8203504804974562 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9856425982715361, |
|
"number": 7152, |
|
"precision": 0.9826292384658143, |
|
"recall": 0.9886744966442953 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7896995708154506, |
|
"number": 105, |
|
"precision": 0.71875, |
|
"recall": 0.8761904761904762 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9552008238928938, |
|
"number": 5646, |
|
"precision": 0.9265734265734266, |
|
"recall": 0.9856535600425079 |
|
}, |
|
"eval_loss": 2.171062469482422, |
|
"eval_overall_accuracy": 0.8314527771445939, |
|
"eval_overall_f1": 0.8629676979459644, |
|
"eval_overall_precision": 0.8419984698799189, |
|
"eval_overall_recall": 0.8850080413957065, |
|
"eval_runtime": 11.2938, |
|
"eval_samples_per_second": 753.154, |
|
"eval_steps_per_second": 23.553, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 6.24, |
|
"learning_rate": 1.8818055830528607e-05, |
|
"loss": 1.8426, |
|
"step": 31500 |
|
}, |
|
{ |
|
"epoch": 6.34, |
|
"learning_rate": 1.8323104335775097e-05, |
|
"loss": 1.879, |
|
"step": 32000 |
|
}, |
|
{ |
|
"epoch": 6.34, |
|
"eval_COMMENT": { |
|
"f1": 0.7243460764587525, |
|
"number": 6854, |
|
"precision": 0.6905675353882789, |
|
"recall": 0.7615990662386928 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8148399502318742, |
|
"number": 8845, |
|
"precision": 0.8152087812606088, |
|
"recall": 0.8144714527981911 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.985952712100139, |
|
"number": 7152, |
|
"precision": 0.9807692307692307, |
|
"recall": 0.9911912751677853 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7796610169491526, |
|
"number": 105, |
|
"precision": 0.7022900763358778, |
|
"recall": 0.8761904761904762 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9541174456428694, |
|
"number": 5646, |
|
"precision": 0.9232935719019219, |
|
"recall": 0.9870704923839887 |
|
}, |
|
"eval_loss": 2.1472506523132324, |
|
"eval_overall_accuracy": 0.830635969911101, |
|
"eval_overall_f1": 0.8623636394773346, |
|
"eval_overall_precision": 0.8451545768856366, |
|
"eval_overall_recall": 0.8802880917418362, |
|
"eval_runtime": 12.4001, |
|
"eval_samples_per_second": 685.964, |
|
"eval_steps_per_second": 21.452, |
|
"step": 32000 |
|
}, |
|
{ |
|
"epoch": 6.43, |
|
"learning_rate": 1.782815284102158e-05, |
|
"loss": 1.8605, |
|
"step": 32500 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"learning_rate": 1.7333201346268066e-05, |
|
"loss": 1.8279, |
|
"step": 33000 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"eval_COMMENT": { |
|
"f1": 0.7266004792879152, |
|
"number": 6854, |
|
"precision": 0.6845568313765966, |
|
"recall": 0.7741464838050773 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8171618650279078, |
|
"number": 8845, |
|
"precision": 0.8150022492127755, |
|
"recall": 0.8193329564725834 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9857839721254356, |
|
"number": 7152, |
|
"precision": 0.9826340650180606, |
|
"recall": 0.9889541387024608 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7860262008733625, |
|
"number": 105, |
|
"precision": 0.7258064516129032, |
|
"recall": 0.8571428571428571 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9554850330216998, |
|
"number": 5646, |
|
"precision": 0.9263262930317645, |
|
"recall": 0.9865391427559334 |
|
}, |
|
"eval_loss": 2.1636247634887695, |
|
"eval_overall_accuracy": 0.83139579059342, |
|
"eval_overall_f1": 0.8632980539433255, |
|
"eval_overall_precision": 0.8434852224964974, |
|
"eval_overall_recall": 0.8840640514649325, |
|
"eval_runtime": 11.6243, |
|
"eval_samples_per_second": 731.745, |
|
"eval_steps_per_second": 22.883, |
|
"step": 33000 |
|
}, |
|
{ |
|
"epoch": 6.63, |
|
"learning_rate": 1.6838249851514553e-05, |
|
"loss": 1.8596, |
|
"step": 33500 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"learning_rate": 1.634329835676104e-05, |
|
"loss": 1.8613, |
|
"step": 34000 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"eval_COMMENT": { |
|
"f1": 0.7281226369698219, |
|
"number": 6854, |
|
"precision": 0.6884180423761861, |
|
"recall": 0.7726874817624745 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8162550161080653, |
|
"number": 8845, |
|
"precision": 0.8161166365280289, |
|
"recall": 0.8163934426229508 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9855233853006681, |
|
"number": 7152, |
|
"precision": 0.9811529933481153, |
|
"recall": 0.9899328859060402 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7777777777777778, |
|
"number": 105, |
|
"precision": 0.6666666666666666, |
|
"recall": 0.9333333333333333 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9550600343053174, |
|
"number": 5646, |
|
"precision": 0.9258397073495178, |
|
"recall": 0.9861849096705633 |
|
}, |
|
"eval_loss": 2.119246482849121, |
|
"eval_overall_accuracy": 0.8333523288503913, |
|
"eval_overall_f1": 0.8633971291866029, |
|
"eval_overall_precision": 0.8444080486663547, |
|
"eval_overall_recall": 0.8832599118942731, |
|
"eval_runtime": 9.0301, |
|
"eval_samples_per_second": 941.963, |
|
"eval_steps_per_second": 29.457, |
|
"step": 34000 |
|
}, |
|
{ |
|
"epoch": 6.83, |
|
"learning_rate": 1.5848346862007525e-05, |
|
"loss": 1.8804, |
|
"step": 34500 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"learning_rate": 1.535339536725401e-05, |
|
"loss": 1.8604, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"eval_COMMENT": { |
|
"f1": 0.7285265601529427, |
|
"number": 6854, |
|
"precision": 0.68467659137577, |
|
"recall": 0.7783775897286256 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8183306055646481, |
|
"number": 8845, |
|
"precision": 0.8169934640522876, |
|
"recall": 0.819672131147541 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865589525732991, |
|
"number": 7152, |
|
"precision": 0.9827945053420286, |
|
"recall": 0.9903523489932886 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7818930041152263, |
|
"number": 105, |
|
"precision": 0.6884057971014492, |
|
"recall": 0.9047619047619048 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9555517418911963, |
|
"number": 5646, |
|
"precision": 0.9267643142476698, |
|
"recall": 0.9861849096705633 |
|
}, |
|
"eval_loss": 2.1069583892822266, |
|
"eval_overall_accuracy": 0.834340095737406, |
|
"eval_overall_f1": 0.8642295423141878, |
|
"eval_overall_precision": 0.8438322395815984, |
|
"eval_overall_recall": 0.8856373680162226, |
|
"eval_runtime": 11.4858, |
|
"eval_samples_per_second": 740.57, |
|
"eval_steps_per_second": 23.159, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 7.03, |
|
"learning_rate": 1.4858443872500496e-05, |
|
"loss": 1.7995, |
|
"step": 35500 |
|
}, |
|
{ |
|
"epoch": 7.13, |
|
"learning_rate": 1.4363492377746981e-05, |
|
"loss": 1.8026, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 7.13, |
|
"eval_COMMENT": { |
|
"f1": 0.7254587315984092, |
|
"number": 6854, |
|
"precision": 0.695146409947854, |
|
"recall": 0.7585351619492268 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8138180584610165, |
|
"number": 8845, |
|
"precision": 0.8139561185252205, |
|
"recall": 0.81368004522329 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861982434127978, |
|
"number": 7152, |
|
"precision": 0.9833194328607172, |
|
"recall": 0.9890939597315436 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7692307692307693, |
|
"number": 105, |
|
"precision": 0.6976744186046512, |
|
"recall": 0.8571428571428571 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9548265200961868, |
|
"number": 5646, |
|
"precision": 0.926808936312104, |
|
"recall": 0.9845908607863975 |
|
}, |
|
"eval_loss": 2.1282002925872803, |
|
"eval_overall_accuracy": 0.8295152344046804, |
|
"eval_overall_f1": 0.8625437813336996, |
|
"eval_overall_precision": 0.8474124552999123, |
|
"eval_overall_recall": 0.8782252989301448, |
|
"eval_runtime": 9.0618, |
|
"eval_samples_per_second": 938.668, |
|
"eval_steps_per_second": 29.354, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 7.23, |
|
"learning_rate": 1.3868540882993467e-05, |
|
"loss": 1.7692, |
|
"step": 36500 |
|
}, |
|
{ |
|
"epoch": 7.33, |
|
"learning_rate": 1.3373589388239954e-05, |
|
"loss": 1.774, |
|
"step": 37000 |
|
}, |
|
{ |
|
"epoch": 7.33, |
|
"eval_COMMENT": { |
|
"f1": 0.7252502780867629, |
|
"number": 6854, |
|
"precision": 0.6926958831341301, |
|
"recall": 0.7610154654216515 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8135153429602889, |
|
"number": 8845, |
|
"precision": 0.8117753011370032, |
|
"recall": 0.8152628603730921 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858644941160087, |
|
"number": 7152, |
|
"precision": 0.9819669857123041, |
|
"recall": 0.9897930648769575 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7948717948717948, |
|
"number": 105, |
|
"precision": 0.7209302325581395, |
|
"recall": 0.8857142857142857 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.953885787891799, |
|
"number": 5646, |
|
"precision": 0.9258209701616936, |
|
"recall": 0.983705278072972 |
|
}, |
|
"eval_loss": 2.1374754905700684, |
|
"eval_overall_accuracy": 0.829952131297014, |
|
"eval_overall_f1": 0.8621126953660542, |
|
"eval_overall_precision": 0.8454789915966386, |
|
"eval_overall_recall": 0.8794140269911195, |
|
"eval_runtime": 13.9271, |
|
"eval_samples_per_second": 610.751, |
|
"eval_steps_per_second": 19.099, |
|
"step": 37000 |
|
}, |
|
{ |
|
"epoch": 7.42, |
|
"learning_rate": 1.287863789348644e-05, |
|
"loss": 1.7909, |
|
"step": 37500 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"learning_rate": 1.2383686398732925e-05, |
|
"loss": 1.8132, |
|
"step": 38000 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"eval_COMMENT": { |
|
"f1": 0.7251632624704737, |
|
"number": 6854, |
|
"precision": 0.6921750663129973, |
|
"recall": 0.7614531660344325 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8144125798970531, |
|
"number": 8845, |
|
"precision": 0.8149196287072674, |
|
"recall": 0.8139061616732617 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862059356276995, |
|
"number": 7152, |
|
"precision": 0.9827825603998889, |
|
"recall": 0.9896532438478747 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7966804979253113, |
|
"number": 105, |
|
"precision": 0.7058823529411765, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9550012856775519, |
|
"number": 5646, |
|
"precision": 0.9252615844544095, |
|
"recall": 0.9867162592986185 |
|
}, |
|
"eval_loss": 2.1093838214874268, |
|
"eval_overall_accuracy": 0.8298571537117241, |
|
"eval_overall_f1": 0.8627067798062913, |
|
"eval_overall_precision": 0.8462987253220328, |
|
"eval_overall_recall": 0.8797636528914062, |
|
"eval_runtime": 10.2321, |
|
"eval_samples_per_second": 831.306, |
|
"eval_steps_per_second": 25.997, |
|
"step": 38000 |
|
}, |
|
{ |
|
"epoch": 7.62, |
|
"learning_rate": 1.1888734903979411e-05, |
|
"loss": 1.7708, |
|
"step": 38500 |
|
}, |
|
{ |
|
"epoch": 7.72, |
|
"learning_rate": 1.1393783409225896e-05, |
|
"loss": 1.805, |
|
"step": 39000 |
|
}, |
|
{ |
|
"epoch": 7.72, |
|
"eval_COMMENT": { |
|
"f1": 0.7264215888751205, |
|
"number": 6854, |
|
"precision": 0.6876955161626694, |
|
"recall": 0.7697694776772688 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.815460358779922, |
|
"number": 8845, |
|
"precision": 0.8163380920009065, |
|
"recall": 0.814584511023177 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862822923194763, |
|
"number": 7152, |
|
"precision": 0.9823831321958663, |
|
"recall": 0.9902125279642058 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7844827586206896, |
|
"number": 105, |
|
"precision": 0.7165354330708661, |
|
"recall": 0.8666666666666667 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9549858526965618, |
|
"number": 5646, |
|
"precision": 0.9255442911750041, |
|
"recall": 0.9863620262132483 |
|
}, |
|
"eval_loss": 2.1103549003601074, |
|
"eval_overall_accuracy": 0.8331053871286377, |
|
"eval_overall_f1": 0.8630181513352608, |
|
"eval_overall_precision": 0.8449633178117986, |
|
"eval_overall_recall": 0.8818614082931263, |
|
"eval_runtime": 10.8182, |
|
"eval_samples_per_second": 786.27, |
|
"eval_steps_per_second": 24.588, |
|
"step": 39000 |
|
}, |
|
{ |
|
"epoch": 7.82, |
|
"learning_rate": 1.0898831914472382e-05, |
|
"loss": 1.8185, |
|
"step": 39500 |
|
}, |
|
{ |
|
"epoch": 7.92, |
|
"learning_rate": 1.0403880419718868e-05, |
|
"loss": 1.7337, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 7.92, |
|
"eval_COMMENT": { |
|
"f1": 0.7251437677544517, |
|
"number": 6854, |
|
"precision": 0.6904604829133131, |
|
"recall": 0.7634957688940764 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8154846001695395, |
|
"number": 8845, |
|
"precision": 0.8152542372881356, |
|
"recall": 0.8157150932730356 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866220735785953, |
|
"number": 7152, |
|
"precision": 0.9833333333333333, |
|
"recall": 0.9899328859060402 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.8, |
|
"number": 105, |
|
"precision": 0.7, |
|
"recall": 0.9333333333333333 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544557852302942, |
|
"number": 5646, |
|
"precision": 0.9253284550141361, |
|
"recall": 0.9854764434998229 |
|
}, |
|
"eval_loss": 2.1034367084503174, |
|
"eval_overall_accuracy": 0.830616974394043, |
|
"eval_overall_f1": 0.8629076459303919, |
|
"eval_overall_precision": 0.8458129071251091, |
|
"eval_overall_recall": 0.8807076428221803, |
|
"eval_runtime": 10.7303, |
|
"eval_samples_per_second": 792.708, |
|
"eval_steps_per_second": 24.79, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 8.02, |
|
"learning_rate": 9.908928924965353e-06, |
|
"loss": 1.7519, |
|
"step": 40500 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"learning_rate": 9.41397743021184e-06, |
|
"loss": 1.7771, |
|
"step": 41000 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"eval_COMMENT": { |
|
"f1": 0.7258660347110893, |
|
"number": 6854, |
|
"precision": 0.6949152542372882, |
|
"recall": 0.759702363583309 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8134750169568167, |
|
"number": 8845, |
|
"precision": 0.8133830677065672, |
|
"recall": 0.8135669869983041 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9863395595204906, |
|
"number": 7152, |
|
"precision": 0.9833240689271817, |
|
"recall": 0.9893736017897091 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7931034482758621, |
|
"number": 105, |
|
"precision": 0.7244094488188977, |
|
"recall": 0.8761904761904762 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9552213149978513, |
|
"number": 5646, |
|
"precision": 0.9278677575555184, |
|
"recall": 0.9842366277010273 |
|
}, |
|
"eval_loss": 2.107405424118042, |
|
"eval_overall_accuracy": 0.8285654585517818, |
|
"eval_overall_f1": 0.8627047069729117, |
|
"eval_overall_precision": 0.8474301902063942, |
|
"eval_overall_recall": 0.8785399622404028, |
|
"eval_runtime": 11.3451, |
|
"eval_samples_per_second": 749.75, |
|
"eval_steps_per_second": 23.446, |
|
"step": 41000 |
|
}, |
|
{ |
|
"epoch": 8.22, |
|
"learning_rate": 8.919025935458326e-06, |
|
"loss": 1.7381, |
|
"step": 41500 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 8.424074440704812e-06, |
|
"loss": 1.7179, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"eval_COMMENT": { |
|
"f1": 0.7297001232370259, |
|
"number": 6854, |
|
"precision": 0.6874355005159959, |
|
"recall": 0.7775021885030639 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8157106527267589, |
|
"number": 8845, |
|
"precision": 0.8154802259887005, |
|
"recall": 0.8159412097230073 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864158829676071, |
|
"number": 7152, |
|
"precision": 0.982923781757601, |
|
"recall": 0.9899328859060402 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.8016194331983806, |
|
"number": 105, |
|
"precision": 0.6971830985915493, |
|
"recall": 0.9428571428571428 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.954233801851217, |
|
"number": 5646, |
|
"precision": 0.9244437064098306, |
|
"recall": 0.9860077931278781 |
|
}, |
|
"eval_loss": 2.1069343090057373, |
|
"eval_overall_accuracy": 0.8319276650710432, |
|
"eval_overall_f1": 0.86363558757747, |
|
"eval_overall_precision": 0.8439387366945844, |
|
"eval_overall_recall": 0.8842738270051045, |
|
"eval_runtime": 11.303, |
|
"eval_samples_per_second": 752.544, |
|
"eval_steps_per_second": 23.534, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 8.41, |
|
"learning_rate": 7.929122945951298e-06, |
|
"loss": 1.7763, |
|
"step": 42500 |
|
}, |
|
{ |
|
"epoch": 8.51, |
|
"learning_rate": 7.434171451197783e-06, |
|
"loss": 1.7005, |
|
"step": 43000 |
|
}, |
|
{ |
|
"epoch": 8.51, |
|
"eval_COMMENT": { |
|
"f1": 0.7259434619133825, |
|
"number": 6854, |
|
"precision": 0.694326052210975, |
|
"recall": 0.7605777648088707 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8142243328810492, |
|
"number": 8845, |
|
"precision": 0.8143164084586678, |
|
"recall": 0.8141322781232334 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9863471719141822, |
|
"number": 7152, |
|
"precision": 0.9827873403664631, |
|
"recall": 0.9899328859060402 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7894736842105263, |
|
"number": 105, |
|
"precision": 0.7317073170731707, |
|
"recall": 0.8571428571428571 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9534087016101404, |
|
"number": 5646, |
|
"precision": 0.9230514096185738, |
|
"recall": 0.9858306765851931 |
|
}, |
|
"eval_loss": 2.1151254177093506, |
|
"eval_overall_accuracy": 0.8293252792341007, |
|
"eval_overall_f1": 0.8626307665923513, |
|
"eval_overall_precision": 0.8465733135855662, |
|
"eval_overall_recall": 0.8793091392210335, |
|
"eval_runtime": 10.9284, |
|
"eval_samples_per_second": 778.339, |
|
"eval_steps_per_second": 24.34, |
|
"step": 43000 |
|
}, |
|
{ |
|
"epoch": 8.61, |
|
"learning_rate": 6.939219956444269e-06, |
|
"loss": 1.7224, |
|
"step": 43500 |
|
}, |
|
{ |
|
"epoch": 8.71, |
|
"learning_rate": 6.444268461690754e-06, |
|
"loss": 1.7078, |
|
"step": 44000 |
|
}, |
|
{ |
|
"epoch": 8.71, |
|
"eval_COMMENT": { |
|
"f1": 0.7251940133037693, |
|
"number": 6854, |
|
"precision": 0.6905515967273687, |
|
"recall": 0.7634957688940764 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8152167768922051, |
|
"number": 8845, |
|
"precision": 0.8151706986208456, |
|
"recall": 0.8152628603730921 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865495853369572, |
|
"number": 7152, |
|
"precision": 0.9834653327775462, |
|
"recall": 0.9896532438478747 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7899159663865547, |
|
"number": 105, |
|
"precision": 0.706766917293233, |
|
"recall": 0.8952380952380953 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9550831476084348, |
|
"number": 5646, |
|
"precision": 0.9254152823920265, |
|
"recall": 0.9867162592986185 |
|
}, |
|
"eval_loss": 2.1110451221466064, |
|
"eval_overall_accuracy": 0.8313008130081301, |
|
"eval_overall_f1": 0.8629231190900369, |
|
"eval_overall_precision": 0.8459394102236851, |
|
"eval_overall_recall": 0.8806027550520943, |
|
"eval_runtime": 11.2874, |
|
"eval_samples_per_second": 753.583, |
|
"eval_steps_per_second": 23.566, |
|
"step": 44000 |
|
}, |
|
{ |
|
"epoch": 8.81, |
|
"learning_rate": 5.949316966937241e-06, |
|
"loss": 1.768, |
|
"step": 44500 |
|
}, |
|
{ |
|
"epoch": 8.91, |
|
"learning_rate": 5.4543654721837265e-06, |
|
"loss": 1.7494, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 8.91, |
|
"eval_COMMENT": { |
|
"f1": 0.7275605726872247, |
|
"number": 6854, |
|
"precision": 0.6886890800104248, |
|
"recall": 0.7710825795156113 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8160244095378009, |
|
"number": 8845, |
|
"precision": 0.8156557099288377, |
|
"recall": 0.8163934426229508 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865552072448623, |
|
"number": 7152, |
|
"precision": 0.9830626128002221, |
|
"recall": 0.9900727069351231 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7899159663865547, |
|
"number": 105, |
|
"precision": 0.706766917293233, |
|
"recall": 0.8952380952380953 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9546817441960078, |
|
"number": 5646, |
|
"precision": 0.924506387921022, |
|
"recall": 0.9868933758413035 |
|
}, |
|
"eval_loss": 2.1094605922698975, |
|
"eval_overall_accuracy": 0.8318896740369273, |
|
"eval_overall_f1": 0.8634685085139848, |
|
"eval_overall_precision": 0.8448645031783205, |
|
"eval_overall_recall": 0.8829102859939865, |
|
"eval_runtime": 10.8603, |
|
"eval_samples_per_second": 783.222, |
|
"eval_steps_per_second": 24.493, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 9.01, |
|
"learning_rate": 4.959413977430212e-06, |
|
"loss": 1.7068, |
|
"step": 45500 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"learning_rate": 4.4644624826766974e-06, |
|
"loss": 1.6805, |
|
"step": 46000 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"eval_COMMENT": { |
|
"f1": 0.727134881797505, |
|
"number": 6854, |
|
"precision": 0.6890920966688439, |
|
"recall": 0.7696235774730085 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8148566905986773, |
|
"number": 8845, |
|
"precision": 0.8149027589326097, |
|
"recall": 0.8148106274731487 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866963850386571, |
|
"number": 7152, |
|
"precision": 0.9830673143650243, |
|
"recall": 0.9903523489932886 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7950819672131149, |
|
"number": 105, |
|
"precision": 0.697841726618705, |
|
"recall": 0.9238095238095239 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9543739279588336, |
|
"number": 5646, |
|
"precision": 0.9251745926172265, |
|
"recall": 0.9854764434998229 |
|
}, |
|
"eval_loss": 2.113201856613159, |
|
"eval_overall_accuracy": 0.8326874857533622, |
|
"eval_overall_f1": 0.8630322106091448, |
|
"eval_overall_precision": 0.8448939947081087, |
|
"eval_overall_recall": 0.8819662960632124, |
|
"eval_runtime": 9.5944, |
|
"eval_samples_per_second": 886.557, |
|
"eval_steps_per_second": 27.724, |
|
"step": 46000 |
|
}, |
|
{ |
|
"epoch": 9.21, |
|
"learning_rate": 3.969510987923184e-06, |
|
"loss": 1.7258, |
|
"step": 46500 |
|
}, |
|
{ |
|
"epoch": 9.31, |
|
"learning_rate": 3.4745594931696697e-06, |
|
"loss": 1.6867, |
|
"step": 47000 |
|
}, |
|
{ |
|
"epoch": 9.31, |
|
"eval_COMMENT": { |
|
"f1": 0.7311783679912154, |
|
"number": 6854, |
|
"precision": 0.6902941557600104, |
|
"recall": 0.7772103880945433 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8176065092100803, |
|
"number": 8845, |
|
"precision": 0.8172370947701344, |
|
"recall": 0.817976257772753 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865533337978123, |
|
"number": 7152, |
|
"precision": 0.9831967782252465, |
|
"recall": 0.9899328859060402 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7932489451476793, |
|
"number": 105, |
|
"precision": 0.7121212121212122, |
|
"recall": 0.8952380952380953 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9545610425240054, |
|
"number": 5646, |
|
"precision": 0.925058158856763, |
|
"recall": 0.9860077931278781 |
|
}, |
|
"eval_loss": 2.1125941276550293, |
|
"eval_overall_accuracy": 0.8326115036851303, |
|
"eval_overall_f1": 0.8647198537327205, |
|
"eval_overall_precision": 0.8456602386283881, |
|
"eval_overall_recall": 0.8846584154954199, |
|
"eval_runtime": 11.2863, |
|
"eval_samples_per_second": 753.659, |
|
"eval_steps_per_second": 23.568, |
|
"step": 47000 |
|
}, |
|
{ |
|
"epoch": 9.4, |
|
"learning_rate": 2.979607998416155e-06, |
|
"loss": 1.6794, |
|
"step": 47500 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"learning_rate": 2.484656503662641e-06, |
|
"loss": 1.7212, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"eval_COMMENT": { |
|
"f1": 0.7277605779153767, |
|
"number": 6854, |
|
"precision": 0.6885822158573103, |
|
"recall": 0.7716661803326524 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8148064424978807, |
|
"number": 8845, |
|
"precision": 0.8145762711864407, |
|
"recall": 0.8150367439231204 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864120967179988, |
|
"number": 7152, |
|
"precision": 0.98319211001528, |
|
"recall": 0.9896532438478747 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7901234567901234, |
|
"number": 105, |
|
"precision": 0.6956521739130435, |
|
"recall": 0.9142857142857143 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9545104086353122, |
|
"number": 5646, |
|
"precision": 0.9243404678944749, |
|
"recall": 0.9867162592986185 |
|
}, |
|
"eval_loss": 2.105802297592163, |
|
"eval_overall_accuracy": 0.8318706785198693, |
|
"eval_overall_f1": 0.86305280612681, |
|
"eval_overall_precision": 0.8443886937614986, |
|
"eval_overall_recall": 0.8825606600936997, |
|
"eval_runtime": 10.3961, |
|
"eval_samples_per_second": 818.189, |
|
"eval_steps_per_second": 25.586, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"learning_rate": 1.989705008909127e-06, |
|
"loss": 1.6992, |
|
"step": 48500 |
|
}, |
|
{ |
|
"epoch": 9.7, |
|
"learning_rate": 1.4947535141556129e-06, |
|
"loss": 1.6952, |
|
"step": 49000 |
|
}, |
|
{ |
|
"epoch": 9.7, |
|
"eval_COMMENT": { |
|
"f1": 0.7261049723756906, |
|
"number": 6854, |
|
"precision": 0.6893522161028062, |
|
"recall": 0.7669973737963233 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.81525854761232, |
|
"number": 8845, |
|
"precision": 0.8150282485875706, |
|
"recall": 0.8154889768230639 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866276640200585, |
|
"number": 7152, |
|
"precision": 0.9829308909242298, |
|
"recall": 0.9903523489932886 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7916666666666667, |
|
"number": 105, |
|
"precision": 0.7037037037037037, |
|
"recall": 0.9047619047619048 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544792113159023, |
|
"number": 5646, |
|
"precision": 0.9249044691809271, |
|
"recall": 0.9860077931278781 |
|
}, |
|
"eval_loss": 2.1103529930114746, |
|
"eval_overall_accuracy": 0.8311488488716663, |
|
"eval_overall_f1": 0.8629658783668163, |
|
"eval_overall_precision": 0.8451199892747017, |
|
"eval_overall_recall": 0.881581707572897, |
|
"eval_runtime": 11.1488, |
|
"eval_samples_per_second": 762.95, |
|
"eval_steps_per_second": 23.859, |
|
"step": 49000 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"learning_rate": 9.998020194020988e-07, |
|
"loss": 1.7282, |
|
"step": 49500 |
|
}, |
|
{ |
|
"epoch": 9.9, |
|
"learning_rate": 5.048505246485845e-07, |
|
"loss": 1.7128, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 9.9, |
|
"eval_COMMENT": { |
|
"f1": 0.7280375120673009, |
|
"number": 6854, |
|
"precision": 0.6902458158995816, |
|
"recall": 0.7702071782900496 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8154846001695395, |
|
"number": 8845, |
|
"precision": 0.8152542372881356, |
|
"recall": 0.8157150932730356 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866276640200585, |
|
"number": 7152, |
|
"precision": 0.9829308909242298, |
|
"recall": 0.9903523489932886 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7851239669421487, |
|
"number": 105, |
|
"precision": 0.6934306569343066, |
|
"recall": 0.9047619047619048 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9546351084812623, |
|
"number": 5646, |
|
"precision": 0.9253532834580216, |
|
"recall": 0.9858306765851931 |
|
}, |
|
"eval_loss": 2.104012966156006, |
|
"eval_overall_accuracy": 0.8311298533546083, |
|
"eval_overall_f1": 0.8634575250607274, |
|
"eval_overall_precision": 0.8453242229367631, |
|
"eval_overall_recall": 0.8823858471435564, |
|
"eval_runtime": 10.6017, |
|
"eval_samples_per_second": 802.322, |
|
"eval_steps_per_second": 25.09, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.899029895070283e-09, |
|
"loss": 1.7318, |
|
"step": 50500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 50510, |
|
"total_flos": 1554473524185192.0, |
|
"train_loss": 2.2027091482279917, |
|
"train_runtime": 3516.1179, |
|
"train_samples_per_second": 459.606, |
|
"train_steps_per_second": 14.365 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 50510, |
|
"num_train_epochs": 10, |
|
"save_steps": 1000, |
|
"total_flos": 1554473524185192.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|