{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.3106796116504854, "eval_steps": 8, "global_step": 32, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.009708737864077669, "grad_norm": 0.38736554980278015, "learning_rate": 4.411764705882353e-07, "loss": 0.1607, "step": 1 }, { "epoch": 0.019417475728155338, "grad_norm": 0.38099536299705505, "learning_rate": 8.823529411764706e-07, "loss": 0.1664, "step": 2 }, { "epoch": 0.02912621359223301, "grad_norm": 0.2045232504606247, "learning_rate": 1.323529411764706e-06, "loss": 0.2686, "step": 3 }, { "epoch": 0.038834951456310676, "grad_norm": 0.370655357837677, "learning_rate": 1.7647058823529412e-06, "loss": 0.1656, "step": 4 }, { "epoch": 0.04854368932038835, "grad_norm": 0.35929468274116516, "learning_rate": 2.2058823529411767e-06, "loss": 0.1269, "step": 5 }, { "epoch": 0.05825242718446602, "grad_norm": 0.2196977585554123, "learning_rate": 2.647058823529412e-06, "loss": 0.1066, "step": 6 }, { "epoch": 0.06796116504854369, "grad_norm": 0.6120501756668091, "learning_rate": 3.0882352941176476e-06, "loss": 0.1936, "step": 7 }, { "epoch": 0.07766990291262135, "grad_norm": 0.7004581689834595, "learning_rate": 3.5294117647058825e-06, "loss": 0.087, "step": 8 }, { "epoch": 0.07766990291262135, "eval_Qnli-dev_cosine_accuracy": 0.6953125, "eval_Qnli-dev_cosine_accuracy_threshold": 0.6691694855690002, "eval_Qnli-dev_cosine_ap": 0.7181099755520133, "eval_Qnli-dev_cosine_f1": 0.6764705882352942, "eval_Qnli-dev_cosine_f1_threshold": 0.49676012992858887, "eval_Qnli-dev_cosine_precision": 0.550531914893617, "eval_Qnli-dev_cosine_recall": 0.8771186440677966, "eval_Qnli-dev_dot_accuracy": 0.669921875, "eval_Qnli-dev_dot_accuracy_threshold": 308.413330078125, "eval_Qnli-dev_dot_ap": 0.678634155184842, "eval_Qnli-dev_dot_f1": 0.6698872785829306, "eval_Qnli-dev_dot_f1_threshold": 208.48468017578125, "eval_Qnli-dev_dot_precision": 0.5402597402597402, "eval_Qnli-dev_dot_recall": 0.8813559322033898, "eval_Qnli-dev_euclidean_accuracy": 0.708984375, "eval_Qnli-dev_euclidean_accuracy_threshold": 17.320636749267578, "eval_Qnli-dev_euclidean_ap": 0.7302104938839877, "eval_Qnli-dev_euclidean_f1": 0.6845637583892616, "eval_Qnli-dev_euclidean_f1_threshold": 20.530838012695312, "eval_Qnli-dev_euclidean_precision": 0.5666666666666667, "eval_Qnli-dev_euclidean_recall": 0.864406779661017, "eval_Qnli-dev_manhattan_accuracy": 0.7109375, "eval_Qnli-dev_manhattan_accuracy_threshold": 369.90869140625, "eval_Qnli-dev_manhattan_ap": 0.732538057005555, "eval_Qnli-dev_manhattan_f1": 0.6836518046709129, "eval_Qnli-dev_manhattan_f1_threshold": 372.4708251953125, "eval_Qnli-dev_manhattan_precision": 0.6851063829787234, "eval_Qnli-dev_manhattan_recall": 0.6822033898305084, "eval_Qnli-dev_max_accuracy": 0.7109375, "eval_Qnli-dev_max_accuracy_threshold": 369.90869140625, "eval_Qnli-dev_max_ap": 0.732538057005555, "eval_Qnli-dev_max_f1": 0.6845637583892616, "eval_Qnli-dev_max_f1_threshold": 372.4708251953125, "eval_Qnli-dev_max_precision": 0.6851063829787234, "eval_Qnli-dev_max_recall": 0.8813559322033898, "eval_allNLI-dev_cosine_accuracy": 0.740234375, "eval_allNLI-dev_cosine_accuracy_threshold": 0.7844594717025757, "eval_allNLI-dev_cosine_ap": 0.6356383940181094, "eval_allNLI-dev_cosine_f1": 0.6369710467706012, "eval_allNLI-dev_cosine_f1_threshold": 0.5889398455619812, "eval_allNLI-dev_cosine_precision": 0.5181159420289855, "eval_allNLI-dev_cosine_recall": 0.8265895953757225, "eval_allNLI-dev_dot_accuracy": 0.72265625, "eval_allNLI-dev_dot_accuracy_threshold": 294.92120361328125, "eval_allNLI-dev_dot_ap": 0.5914839688879726, "eval_allNLI-dev_dot_f1": 0.6099290780141845, "eval_allNLI-dev_dot_f1_threshold": 246.92991638183594, "eval_allNLI-dev_dot_precision": 0.516, "eval_allNLI-dev_dot_recall": 0.7456647398843931, "eval_allNLI-dev_euclidean_accuracy": 0.744140625, "eval_allNLI-dev_euclidean_accuracy_threshold": 13.74991226196289, "eval_allNLI-dev_euclidean_ap": 0.6412989964435845, "eval_allNLI-dev_euclidean_f1": 0.6464208242950108, "eval_allNLI-dev_euclidean_f1_threshold": 18.407054901123047, "eval_allNLI-dev_euclidean_precision": 0.5173611111111112, "eval_allNLI-dev_euclidean_recall": 0.861271676300578, "eval_allNLI-dev_manhattan_accuracy": 0.744140625, "eval_allNLI-dev_manhattan_accuracy_threshold": 313.8516540527344, "eval_allNLI-dev_manhattan_ap": 0.6416934437743762, "eval_allNLI-dev_manhattan_f1": 0.655, "eval_allNLI-dev_manhattan_f1_threshold": 361.0255126953125, "eval_allNLI-dev_manhattan_precision": 0.5770925110132159, "eval_allNLI-dev_manhattan_recall": 0.7572254335260116, "eval_allNLI-dev_max_accuracy": 0.744140625, "eval_allNLI-dev_max_accuracy_threshold": 313.8516540527344, "eval_allNLI-dev_max_ap": 0.6416934437743762, "eval_allNLI-dev_max_f1": 0.655, "eval_allNLI-dev_max_f1_threshold": 361.0255126953125, "eval_allNLI-dev_max_precision": 0.5770925110132159, "eval_allNLI-dev_max_recall": 0.861271676300578, "eval_sequential_score": 0.732538057005555, "eval_sts-test_pearson_cosine": 0.8858982884210256, "eval_sts-test_pearson_dot": 0.8750202743648935, "eval_sts-test_pearson_euclidean": 0.9073481145616336, "eval_sts-test_pearson_manhattan": 0.908032029485236, "eval_sts-test_pearson_max": 0.908032029485236, "eval_sts-test_spearman_cosine": 0.9075027297778789, "eval_sts-test_spearman_dot": 0.8759972599919353, "eval_sts-test_spearman_euclidean": 0.9040041656648221, "eval_sts-test_spearman_manhattan": 0.9045863348242628, "eval_sts-test_spearman_max": 0.9075027297778789, "eval_vitaminc-pairs_loss": 2.801919460296631, "eval_vitaminc-pairs_runtime": 3.8986, "eval_vitaminc-pairs_samples_per_second": 32.832, "eval_vitaminc-pairs_steps_per_second": 0.257, "step": 8 }, { "epoch": 0.07766990291262135, "eval_negation-triplets_loss": 1.355710744857788, "eval_negation-triplets_runtime": 0.639, "eval_negation-triplets_samples_per_second": 200.304, "eval_negation-triplets_steps_per_second": 1.565, "step": 8 }, { "epoch": 0.07766990291262135, "eval_scitail-pairs-pos_loss": 0.06071745231747627, "eval_scitail-pairs-pos_runtime": 0.9322, "eval_scitail-pairs-pos_samples_per_second": 137.311, "eval_scitail-pairs-pos_steps_per_second": 1.073, "step": 8 }, { "epoch": 0.07766990291262135, "eval_scitail-pairs-qa_loss": 1.0544098927312007e-07, "eval_scitail-pairs-qa_runtime": 0.5629, "eval_scitail-pairs-qa_samples_per_second": 227.378, "eval_scitail-pairs-qa_steps_per_second": 1.776, "step": 8 }, { "epoch": 0.07766990291262135, "eval_xsum-pairs_loss": 0.00016850717656780034, "eval_xsum-pairs_runtime": 2.9256, "eval_xsum-pairs_samples_per_second": 43.751, "eval_xsum-pairs_steps_per_second": 0.342, "step": 8 }, { "epoch": 0.07766990291262135, "eval_sciq_pairs_loss": 0.0582379512488842, "eval_sciq_pairs_runtime": 2.5278, "eval_sciq_pairs_samples_per_second": 34.418, "eval_sciq_pairs_steps_per_second": 0.396, "step": 8 }, { "epoch": 0.07766990291262135, "eval_qasc_pairs_loss": 0.07362987846136093, "eval_qasc_pairs_runtime": 0.3723, "eval_qasc_pairs_samples_per_second": 233.691, "eval_qasc_pairs_steps_per_second": 2.686, "step": 8 }, { "epoch": 0.07766990291262135, "eval_openbookqa_pairs_loss": 1.3787189722061157, "eval_openbookqa_pairs_runtime": 0.5744, "eval_openbookqa_pairs_samples_per_second": 222.849, "eval_openbookqa_pairs_steps_per_second": 1.741, "step": 8 }, { "epoch": 0.07766990291262135, "eval_msmarco_pairs_loss": 0.1278172731399536, "eval_msmarco_pairs_runtime": 1.0983, "eval_msmarco_pairs_samples_per_second": 79.215, "eval_msmarco_pairs_steps_per_second": 0.911, "step": 8 }, { "epoch": 0.07766990291262135, "eval_nq_pairs_loss": 0.0051126074977219105, "eval_nq_pairs_runtime": 2.2469, "eval_nq_pairs_samples_per_second": 38.719, "eval_nq_pairs_steps_per_second": 0.445, "step": 8 }, { "epoch": 0.07766990291262135, "eval_trivia_pairs_loss": 0.26755890250205994, "eval_trivia_pairs_runtime": 2.4342, "eval_trivia_pairs_samples_per_second": 41.081, "eval_trivia_pairs_steps_per_second": 0.411, "step": 8 }, { "epoch": 0.07766990291262135, "eval_gooaq_pairs_loss": 0.05755230411887169, "eval_gooaq_pairs_runtime": 0.5805, "eval_gooaq_pairs_samples_per_second": 149.876, "eval_gooaq_pairs_steps_per_second": 1.723, "step": 8 }, { "epoch": 0.07766990291262135, "eval_paws-pos_loss": 0.04592936113476753, "eval_paws-pos_runtime": 0.6903, "eval_paws-pos_samples_per_second": 185.415, "eval_paws-pos_steps_per_second": 1.449, "step": 8 }, { "epoch": 0.07766990291262135, "eval_global_dataset_loss": 0.4901905357837677, "eval_global_dataset_runtime": 25.0307, "eval_global_dataset_samples_per_second": 26.487, "eval_global_dataset_steps_per_second": 0.24, "step": 8 }, { "epoch": 0.08737864077669903, "grad_norm": 1.2741845846176147, "learning_rate": 3.970588235294118e-06, "loss": 0.1952, "step": 9 }, { "epoch": 0.0970873786407767, "grad_norm": 0.46481379866600037, "learning_rate": 4.411764705882353e-06, "loss": 0.4167, "step": 10 }, { "epoch": 0.10679611650485436, "grad_norm": 0.7963629961013794, "learning_rate": 4.852941176470589e-06, "loss": 0.7876, "step": 11 }, { "epoch": 0.11650485436893204, "grad_norm": 0.6939969658851624, "learning_rate": 5.294117647058824e-06, "loss": 0.3714, "step": 12 }, { "epoch": 0.1262135922330097, "grad_norm": 0.44538313150405884, "learning_rate": 5.735294117647059e-06, "loss": 0.1852, "step": 13 }, { "epoch": 0.13592233009708737, "grad_norm": 0.3318534791469574, "learning_rate": 6.176470588235295e-06, "loss": 0.1144, "step": 14 }, { "epoch": 0.14563106796116504, "grad_norm": 0.4242781698703766, "learning_rate": 6.61764705882353e-06, "loss": 0.1234, "step": 15 }, { "epoch": 0.1553398058252427, "grad_norm": 0.2060050666332245, "learning_rate": 7.058823529411765e-06, "loss": 0.0569, "step": 16 }, { "epoch": 0.1553398058252427, "eval_Qnli-dev_cosine_accuracy": 0.6953125, "eval_Qnli-dev_cosine_accuracy_threshold": 0.6684989929199219, "eval_Qnli-dev_cosine_ap": 0.7189160511154118, "eval_Qnli-dev_cosine_f1": 0.6764705882352942, "eval_Qnli-dev_cosine_f1_threshold": 0.49889329075813293, "eval_Qnli-dev_cosine_precision": 0.550531914893617, "eval_Qnli-dev_cosine_recall": 0.8771186440677966, "eval_Qnli-dev_dot_accuracy": 0.66796875, "eval_Qnli-dev_dot_accuracy_threshold": 303.81427001953125, "eval_Qnli-dev_dot_ap": 0.6791091476516111, "eval_Qnli-dev_dot_f1": 0.6697247706422018, "eval_Qnli-dev_dot_f1_threshold": 184.08914184570312, "eval_Qnli-dev_dot_precision": 0.5239234449760766, "eval_Qnli-dev_dot_recall": 0.9279661016949152, "eval_Qnli-dev_euclidean_accuracy": 0.7109375, "eval_Qnli-dev_euclidean_accuracy_threshold": 17.21223258972168, "eval_Qnli-dev_euclidean_ap": 0.7305713530476123, "eval_Qnli-dev_euclidean_f1": 0.6848739495798319, "eval_Qnli-dev_euclidean_f1_threshold": 17.62983512878418, "eval_Qnli-dev_euclidean_precision": 0.6791666666666667, "eval_Qnli-dev_euclidean_recall": 0.690677966101695, "eval_Qnli-dev_manhattan_accuracy": 0.712890625, "eval_Qnli-dev_manhattan_accuracy_threshold": 367.2698974609375, "eval_Qnli-dev_manhattan_ap": 0.7327153618467641, "eval_Qnli-dev_manhattan_f1": 0.6824034334763949, "eval_Qnli-dev_manhattan_f1_threshold": 368.1672058105469, "eval_Qnli-dev_manhattan_precision": 0.691304347826087, "eval_Qnli-dev_manhattan_recall": 0.673728813559322, "eval_Qnli-dev_max_accuracy": 0.712890625, "eval_Qnli-dev_max_accuracy_threshold": 367.2698974609375, "eval_Qnli-dev_max_ap": 0.7327153618467641, "eval_Qnli-dev_max_f1": 0.6848739495798319, "eval_Qnli-dev_max_f1_threshold": 368.1672058105469, "eval_Qnli-dev_max_precision": 0.691304347826087, "eval_Qnli-dev_max_recall": 0.9279661016949152, "eval_allNLI-dev_cosine_accuracy": 0.7421875, "eval_allNLI-dev_cosine_accuracy_threshold": 0.7840416431427002, "eval_allNLI-dev_cosine_ap": 0.6349487371750362, "eval_allNLI-dev_cosine_f1": 0.6367713004484306, "eval_allNLI-dev_cosine_f1_threshold": 0.5954304337501526, "eval_allNLI-dev_cosine_precision": 0.5201465201465202, "eval_allNLI-dev_cosine_recall": 0.8208092485549133, "eval_allNLI-dev_dot_accuracy": 0.724609375, "eval_allNLI-dev_dot_accuracy_threshold": 291.18670654296875, "eval_allNLI-dev_dot_ap": 0.5913303711668598, "eval_allNLI-dev_dot_f1": 0.6070588235294118, "eval_allNLI-dev_dot_f1_threshold": 242.49884033203125, "eval_allNLI-dev_dot_precision": 0.5119047619047619, "eval_allNLI-dev_dot_recall": 0.7456647398843931, "eval_allNLI-dev_euclidean_accuracy": 0.744140625, "eval_allNLI-dev_euclidean_accuracy_threshold": 13.559854507446289, "eval_allNLI-dev_euclidean_ap": 0.6408865358113234, "eval_allNLI-dev_euclidean_f1": 0.6450116009280741, "eval_allNLI-dev_euclidean_f1_threshold": 17.65105628967285, "eval_allNLI-dev_euclidean_precision": 0.5387596899224806, "eval_allNLI-dev_euclidean_recall": 0.8034682080924855, "eval_allNLI-dev_manhattan_accuracy": 0.7421875, "eval_allNLI-dev_manhattan_accuracy_threshold": 307.83563232421875, "eval_allNLI-dev_manhattan_ap": 0.6414745653251337, "eval_allNLI-dev_manhattan_f1": 0.6533665835411472, "eval_allNLI-dev_manhattan_f1_threshold": 357.5172119140625, "eval_allNLI-dev_manhattan_precision": 0.5745614035087719, "eval_allNLI-dev_manhattan_recall": 0.7572254335260116, "eval_allNLI-dev_max_accuracy": 0.744140625, "eval_allNLI-dev_max_accuracy_threshold": 307.83563232421875, "eval_allNLI-dev_max_ap": 0.6414745653251337, "eval_allNLI-dev_max_f1": 0.6533665835411472, "eval_allNLI-dev_max_f1_threshold": 357.5172119140625, "eval_allNLI-dev_max_precision": 0.5745614035087719, "eval_allNLI-dev_max_recall": 0.8208092485549133, "eval_sequential_score": 0.7327153618467641, "eval_sts-test_pearson_cosine": 0.8857317653883374, "eval_sts-test_pearson_dot": 0.8740754819923455, "eval_sts-test_pearson_euclidean": 0.9064480556463691, "eval_sts-test_pearson_manhattan": 0.9071116458208927, "eval_sts-test_pearson_max": 0.9071116458208927, "eval_sts-test_spearman_cosine": 0.9078527293932209, "eval_sts-test_spearman_dot": 0.8744967501974819, "eval_sts-test_spearman_euclidean": 0.9030452803869885, "eval_sts-test_spearman_manhattan": 0.903667904686727, "eval_sts-test_spearman_max": 0.9078527293932209, "eval_vitaminc-pairs_loss": 2.799455165863037, "eval_vitaminc-pairs_runtime": 3.8555, "eval_vitaminc-pairs_samples_per_second": 33.2, "eval_vitaminc-pairs_steps_per_second": 0.259, "step": 16 }, { "epoch": 0.1553398058252427, "eval_negation-triplets_loss": 1.3501245975494385, "eval_negation-triplets_runtime": 0.6331, "eval_negation-triplets_samples_per_second": 202.181, "eval_negation-triplets_steps_per_second": 1.58, "step": 16 }, { "epoch": 0.1553398058252427, "eval_scitail-pairs-pos_loss": 0.060843899846076965, "eval_scitail-pairs-pos_runtime": 0.9131, "eval_scitail-pairs-pos_samples_per_second": 140.183, "eval_scitail-pairs-pos_steps_per_second": 1.095, "step": 16 }, { "epoch": 0.1553398058252427, "eval_scitail-pairs-qa_loss": 1.1229322893768767e-07, "eval_scitail-pairs-qa_runtime": 0.5691, "eval_scitail-pairs-qa_samples_per_second": 224.9, "eval_scitail-pairs-qa_steps_per_second": 1.757, "step": 16 }, { "epoch": 0.1553398058252427, "eval_xsum-pairs_loss": 0.0001665251620579511, "eval_xsum-pairs_runtime": 2.9369, "eval_xsum-pairs_samples_per_second": 43.584, "eval_xsum-pairs_steps_per_second": 0.34, "step": 16 }, { "epoch": 0.1553398058252427, "eval_sciq_pairs_loss": 0.05696266517043114, "eval_sciq_pairs_runtime": 2.5397, "eval_sciq_pairs_samples_per_second": 34.256, "eval_sciq_pairs_steps_per_second": 0.394, "step": 16 }, { "epoch": 0.1553398058252427, "eval_qasc_pairs_loss": 0.07378190755844116, "eval_qasc_pairs_runtime": 0.3731, "eval_qasc_pairs_samples_per_second": 233.155, "eval_qasc_pairs_steps_per_second": 2.68, "step": 16 }, { "epoch": 0.1553398058252427, "eval_openbookqa_pairs_loss": 1.3709176778793335, "eval_openbookqa_pairs_runtime": 0.5704, "eval_openbookqa_pairs_samples_per_second": 224.402, "eval_openbookqa_pairs_steps_per_second": 1.753, "step": 16 }, { "epoch": 0.1553398058252427, "eval_msmarco_pairs_loss": 0.13161690533161163, "eval_msmarco_pairs_runtime": 1.0994, "eval_msmarco_pairs_samples_per_second": 79.136, "eval_msmarco_pairs_steps_per_second": 0.91, "step": 16 }, { "epoch": 0.1553398058252427, "eval_nq_pairs_loss": 0.005713976453989744, "eval_nq_pairs_runtime": 2.2521, "eval_nq_pairs_samples_per_second": 38.631, "eval_nq_pairs_steps_per_second": 0.444, "step": 16 }, { "epoch": 0.1553398058252427, "eval_trivia_pairs_loss": 0.2678990364074707, "eval_trivia_pairs_runtime": 2.4403, "eval_trivia_pairs_samples_per_second": 40.979, "eval_trivia_pairs_steps_per_second": 0.41, "step": 16 }, { "epoch": 0.1553398058252427, "eval_gooaq_pairs_loss": 0.05776378884911537, "eval_gooaq_pairs_runtime": 0.5822, "eval_gooaq_pairs_samples_per_second": 149.421, "eval_gooaq_pairs_steps_per_second": 1.717, "step": 16 }, { "epoch": 0.1553398058252427, "eval_paws-pos_loss": 0.04598955065011978, "eval_paws-pos_runtime": 0.6747, "eval_paws-pos_samples_per_second": 189.727, "eval_paws-pos_steps_per_second": 1.482, "step": 16 }, { "epoch": 0.1553398058252427, "eval_global_dataset_loss": 0.48036298155784607, "eval_global_dataset_runtime": 25.0731, "eval_global_dataset_samples_per_second": 26.443, "eval_global_dataset_steps_per_second": 0.239, "step": 16 }, { "epoch": 0.1650485436893204, "grad_norm": 0.4544373154640198, "learning_rate": 7.5e-06, "loss": 0.3203, "step": 17 }, { "epoch": 0.17475728155339806, "grad_norm": 0.4103369414806366, "learning_rate": 7.941176470588236e-06, "loss": 0.2113, "step": 18 }, { "epoch": 0.18446601941747573, "grad_norm": 1.5407989025115967, "learning_rate": 8.382352941176472e-06, "loss": 0.3137, "step": 19 }, { "epoch": 0.1941747572815534, "grad_norm": 0.46951910853385925, "learning_rate": 8.823529411764707e-06, "loss": 0.4048, "step": 20 }, { "epoch": 0.20388349514563106, "grad_norm": 0.6390318870544434, "learning_rate": 9.264705882352942e-06, "loss": 0.2855, "step": 21 }, { "epoch": 0.21359223300970873, "grad_norm": 0.22210820019245148, "learning_rate": 9.705882352941177e-06, "loss": 0.0593, "step": 22 }, { "epoch": 0.22330097087378642, "grad_norm": 0.7516863346099854, "learning_rate": 1.0147058823529413e-05, "loss": 0.1228, "step": 23 }, { "epoch": 0.23300970873786409, "grad_norm": 0.4010964035987854, "learning_rate": 1.0588235294117648e-05, "loss": 0.0811, "step": 24 }, { "epoch": 0.23300970873786409, "eval_Qnli-dev_cosine_accuracy": 0.6953125, "eval_Qnli-dev_cosine_accuracy_threshold": 0.651726484298706, "eval_Qnli-dev_cosine_ap": 0.7197319450561322, "eval_Qnli-dev_cosine_f1": 0.6766666666666667, "eval_Qnli-dev_cosine_f1_threshold": 0.508252739906311, "eval_Qnli-dev_cosine_precision": 0.5576923076923077, "eval_Qnli-dev_cosine_recall": 0.8601694915254238, "eval_Qnli-dev_dot_accuracy": 0.66796875, "eval_Qnli-dev_dot_accuracy_threshold": 295.55169677734375, "eval_Qnli-dev_dot_ap": 0.6760811849258039, "eval_Qnli-dev_dot_f1": 0.6717791411042945, "eval_Qnli-dev_dot_f1_threshold": 181.16976928710938, "eval_Qnli-dev_dot_precision": 0.5264423076923077, "eval_Qnli-dev_dot_recall": 0.9279661016949152, "eval_Qnli-dev_euclidean_accuracy": 0.7109375, "eval_Qnli-dev_euclidean_accuracy_threshold": 17.042926788330078, "eval_Qnli-dev_euclidean_ap": 0.7310579368620943, "eval_Qnli-dev_euclidean_f1": 0.6848739495798319, "eval_Qnli-dev_euclidean_f1_threshold": 17.435243606567383, "eval_Qnli-dev_euclidean_precision": 0.6791666666666667, "eval_Qnli-dev_euclidean_recall": 0.690677966101695, "eval_Qnli-dev_manhattan_accuracy": 0.708984375, "eval_Qnli-dev_manhattan_accuracy_threshold": 364.541748046875, "eval_Qnli-dev_manhattan_ap": 0.7326520634446195, "eval_Qnli-dev_manhattan_f1": 0.6796747967479675, "eval_Qnli-dev_manhattan_f1_threshold": 434.2391357421875, "eval_Qnli-dev_manhattan_precision": 0.5514511873350924, "eval_Qnli-dev_manhattan_recall": 0.885593220338983, "eval_Qnli-dev_max_accuracy": 0.7109375, "eval_Qnli-dev_max_accuracy_threshold": 364.541748046875, "eval_Qnli-dev_max_ap": 0.7326520634446195, "eval_Qnli-dev_max_f1": 0.6848739495798319, "eval_Qnli-dev_max_f1_threshold": 434.2391357421875, "eval_Qnli-dev_max_precision": 0.6791666666666667, "eval_Qnli-dev_max_recall": 0.9279661016949152, "eval_allNLI-dev_cosine_accuracy": 0.740234375, "eval_allNLI-dev_cosine_accuracy_threshold": 0.7892441749572754, "eval_allNLI-dev_cosine_ap": 0.6337074778927934, "eval_allNLI-dev_cosine_f1": 0.6367713004484306, "eval_allNLI-dev_cosine_f1_threshold": 0.5993767976760864, "eval_allNLI-dev_cosine_precision": 0.5201465201465202, "eval_allNLI-dev_cosine_recall": 0.8208092485549133, "eval_allNLI-dev_dot_accuracy": 0.724609375, "eval_allNLI-dev_dot_accuracy_threshold": 286.42156982421875, "eval_allNLI-dev_dot_ap": 0.5908477549155566, "eval_allNLI-dev_dot_f1": 0.6013667425968109, "eval_allNLI-dev_dot_f1_threshold": 234.44680786132812, "eval_allNLI-dev_dot_precision": 0.49624060150375937, "eval_allNLI-dev_dot_recall": 0.7630057803468208, "eval_allNLI-dev_euclidean_accuracy": 0.744140625, "eval_allNLI-dev_euclidean_accuracy_threshold": 13.312193870544434, "eval_allNLI-dev_euclidean_ap": 0.6395819541470485, "eval_allNLI-dev_euclidean_f1": 0.6495327102803738, "eval_allNLI-dev_euclidean_f1_threshold": 17.35163116455078, "eval_allNLI-dev_euclidean_precision": 0.5450980392156862, "eval_allNLI-dev_euclidean_recall": 0.8034682080924855, "eval_allNLI-dev_manhattan_accuracy": 0.740234375, "eval_allNLI-dev_manhattan_accuracy_threshold": 273.14263916015625, "eval_allNLI-dev_manhattan_ap": 0.6396466602355837, "eval_allNLI-dev_manhattan_f1": 0.6482758620689655, "eval_allNLI-dev_manhattan_f1_threshold": 367.1748046875, "eval_allNLI-dev_manhattan_precision": 0.5381679389312977, "eval_allNLI-dev_manhattan_recall": 0.815028901734104, "eval_allNLI-dev_max_accuracy": 0.744140625, "eval_allNLI-dev_max_accuracy_threshold": 286.42156982421875, "eval_allNLI-dev_max_ap": 0.6396466602355837, "eval_allNLI-dev_max_f1": 0.6495327102803738, "eval_allNLI-dev_max_f1_threshold": 367.1748046875, "eval_allNLI-dev_max_precision": 0.5450980392156862, "eval_allNLI-dev_max_recall": 0.8208092485549133, "eval_sequential_score": 0.7326520634446195, "eval_sts-test_pearson_cosine": 0.8852721127163659, "eval_sts-test_pearson_dot": 0.8721890224510694, "eval_sts-test_pearson_euclidean": 0.9051850094674976, "eval_sts-test_pearson_manhattan": 0.9058527749212866, "eval_sts-test_pearson_max": 0.9058527749212866, "eval_sts-test_spearman_cosine": 0.9079463937833133, "eval_sts-test_spearman_dot": 0.8718395993011061, "eval_sts-test_spearman_euclidean": 0.901890876848136, "eval_sts-test_spearman_manhattan": 0.902598976057132, "eval_sts-test_spearman_max": 0.9079463937833133, "eval_vitaminc-pairs_loss": 2.794250965118408, "eval_vitaminc-pairs_runtime": 3.828, "eval_vitaminc-pairs_samples_per_second": 33.438, "eval_vitaminc-pairs_steps_per_second": 0.261, "step": 24 }, { "epoch": 0.23300970873786409, "eval_negation-triplets_loss": 1.340283989906311, "eval_negation-triplets_runtime": 0.6301, "eval_negation-triplets_samples_per_second": 203.131, "eval_negation-triplets_steps_per_second": 1.587, "step": 24 }, { "epoch": 0.23300970873786409, "eval_scitail-pairs-pos_loss": 0.060825277119874954, "eval_scitail-pairs-pos_runtime": 0.8911, "eval_scitail-pairs-pos_samples_per_second": 143.641, "eval_scitail-pairs-pos_steps_per_second": 1.122, "step": 24 }, { "epoch": 0.23300970873786409, "eval_scitail-pairs-qa_loss": 1.2640072100111865e-07, "eval_scitail-pairs-qa_runtime": 0.5679, "eval_scitail-pairs-qa_samples_per_second": 225.406, "eval_scitail-pairs-qa_steps_per_second": 1.761, "step": 24 }, { "epoch": 0.23300970873786409, "eval_xsum-pairs_loss": 0.0001656880631344393, "eval_xsum-pairs_runtime": 2.9303, "eval_xsum-pairs_samples_per_second": 43.681, "eval_xsum-pairs_steps_per_second": 0.341, "step": 24 }, { "epoch": 0.23300970873786409, "eval_sciq_pairs_loss": 0.05494913458824158, "eval_sciq_pairs_runtime": 2.53, "eval_sciq_pairs_samples_per_second": 34.387, "eval_sciq_pairs_steps_per_second": 0.395, "step": 24 }, { "epoch": 0.23300970873786409, "eval_qasc_pairs_loss": 0.07522959262132645, "eval_qasc_pairs_runtime": 0.3767, "eval_qasc_pairs_samples_per_second": 230.935, "eval_qasc_pairs_steps_per_second": 2.654, "step": 24 }, { "epoch": 0.23300970873786409, "eval_openbookqa_pairs_loss": 1.3630236387252808, "eval_openbookqa_pairs_runtime": 0.5729, "eval_openbookqa_pairs_samples_per_second": 223.429, "eval_openbookqa_pairs_steps_per_second": 1.746, "step": 24 }, { "epoch": 0.23300970873786409, "eval_msmarco_pairs_loss": 0.14150576293468475, "eval_msmarco_pairs_runtime": 1.095, "eval_msmarco_pairs_samples_per_second": 79.449, "eval_msmarco_pairs_steps_per_second": 0.913, "step": 24 }, { "epoch": 0.23300970873786409, "eval_nq_pairs_loss": 0.0068158903159201145, "eval_nq_pairs_runtime": 2.2497, "eval_nq_pairs_samples_per_second": 38.672, "eval_nq_pairs_steps_per_second": 0.445, "step": 24 }, { "epoch": 0.23300970873786409, "eval_trivia_pairs_loss": 0.26929065585136414, "eval_trivia_pairs_runtime": 2.4805, "eval_trivia_pairs_samples_per_second": 40.314, "eval_trivia_pairs_steps_per_second": 0.403, "step": 24 }, { "epoch": 0.23300970873786409, "eval_gooaq_pairs_loss": 0.05852792412042618, "eval_gooaq_pairs_runtime": 0.5795, "eval_gooaq_pairs_samples_per_second": 150.128, "eval_gooaq_pairs_steps_per_second": 1.726, "step": 24 }, { "epoch": 0.23300970873786409, "eval_paws-pos_loss": 0.046059899032115936, "eval_paws-pos_runtime": 0.668, "eval_paws-pos_samples_per_second": 191.605, "eval_paws-pos_steps_per_second": 1.497, "step": 24 }, { "epoch": 0.23300970873786409, "eval_global_dataset_loss": 0.4663805067539215, "eval_global_dataset_runtime": 25.0232, "eval_global_dataset_samples_per_second": 26.495, "eval_global_dataset_steps_per_second": 0.24, "step": 24 }, { "epoch": 0.24271844660194175, "grad_norm": 0.5014179944992065, "learning_rate": 1.1029411764705883e-05, "loss": 0.2806, "step": 25 }, { "epoch": 0.2524271844660194, "grad_norm": 0.320849746465683, "learning_rate": 1.1470588235294118e-05, "loss": 0.2202, "step": 26 }, { "epoch": 0.2621359223300971, "grad_norm": 0.28120842576026917, "learning_rate": 1.1911764705882354e-05, "loss": 0.195, "step": 27 }, { "epoch": 0.27184466019417475, "grad_norm": 0.755657434463501, "learning_rate": 1.235294117647059e-05, "loss": 0.1986, "step": 28 }, { "epoch": 0.2815533980582524, "grad_norm": 0.5951756238937378, "learning_rate": 1.2794117647058824e-05, "loss": 0.0546, "step": 29 }, { "epoch": 0.2912621359223301, "grad_norm": 0.5201478004455566, "learning_rate": 1.323529411764706e-05, "loss": 0.3083, "step": 30 }, { "epoch": 0.30097087378640774, "grad_norm": 0.261674702167511, "learning_rate": 1.3676470588235295e-05, "loss": 0.127, "step": 31 }, { "epoch": 0.3106796116504854, "grad_norm": 0.6115577220916748, "learning_rate": 1.411764705882353e-05, "loss": 0.2447, "step": 32 }, { "epoch": 0.3106796116504854, "eval_Qnli-dev_cosine_accuracy": 0.6953125, "eval_Qnli-dev_cosine_accuracy_threshold": 0.6684017181396484, "eval_Qnli-dev_cosine_ap": 0.7203045959833639, "eval_Qnli-dev_cosine_f1": 0.6755852842809364, "eval_Qnli-dev_cosine_f1_threshold": 0.5110002756118774, "eval_Qnli-dev_cosine_precision": 0.5580110497237569, "eval_Qnli-dev_cosine_recall": 0.8559322033898306, "eval_Qnli-dev_dot_accuracy": 0.66796875, "eval_Qnli-dev_dot_accuracy_threshold": 294.4780578613281, "eval_Qnli-dev_dot_ap": 0.676288649042553, "eval_Qnli-dev_dot_f1": 0.6738794435857806, "eval_Qnli-dev_dot_f1_threshold": 184.11688232421875, "eval_Qnli-dev_dot_precision": 0.5304136253041363, "eval_Qnli-dev_dot_recall": 0.923728813559322, "eval_Qnli-dev_euclidean_accuracy": 0.7109375, "eval_Qnli-dev_euclidean_accuracy_threshold": 16.85451889038086, "eval_Qnli-dev_euclidean_ap": 0.7312433122162235, "eval_Qnli-dev_euclidean_f1": 0.6848739495798319, "eval_Qnli-dev_euclidean_f1_threshold": 17.339509963989258, "eval_Qnli-dev_euclidean_precision": 0.6791666666666667, "eval_Qnli-dev_euclidean_recall": 0.690677966101695, "eval_Qnli-dev_manhattan_accuracy": 0.70703125, "eval_Qnli-dev_manhattan_accuracy_threshold": 359.81439208984375, "eval_Qnli-dev_manhattan_ap": 0.7325123059741169, "eval_Qnli-dev_manhattan_f1": 0.6800804828973843, "eval_Qnli-dev_manhattan_f1_threshold": 374.1423645019531, "eval_Qnli-dev_manhattan_precision": 0.6475095785440613, "eval_Qnli-dev_manhattan_recall": 0.7161016949152542, "eval_Qnli-dev_max_accuracy": 0.7109375, "eval_Qnli-dev_max_accuracy_threshold": 359.81439208984375, "eval_Qnli-dev_max_ap": 0.7325123059741169, "eval_Qnli-dev_max_f1": 0.6848739495798319, "eval_Qnli-dev_max_f1_threshold": 374.1423645019531, "eval_Qnli-dev_max_precision": 0.6791666666666667, "eval_Qnli-dev_max_recall": 0.923728813559322, "eval_allNLI-dev_cosine_accuracy": 0.7421875, "eval_allNLI-dev_cosine_accuracy_threshold": 0.7891373634338379, "eval_allNLI-dev_cosine_ap": 0.6322954079925401, "eval_allNLI-dev_cosine_f1": 0.6337078651685394, "eval_allNLI-dev_cosine_f1_threshold": 0.6023260354995728, "eval_allNLI-dev_cosine_precision": 0.5183823529411765, "eval_allNLI-dev_cosine_recall": 0.815028901734104, "eval_allNLI-dev_dot_accuracy": 0.724609375, "eval_allNLI-dev_dot_accuracy_threshold": 283.5550842285156, "eval_allNLI-dev_dot_ap": 0.5884575729907496, "eval_allNLI-dev_dot_f1": 0.5986394557823129, "eval_allNLI-dev_dot_f1_threshold": 231.64846801757812, "eval_allNLI-dev_dot_precision": 0.4925373134328358, "eval_allNLI-dev_dot_recall": 0.7630057803468208, "eval_allNLI-dev_euclidean_accuracy": 0.7421875, "eval_allNLI-dev_euclidean_accuracy_threshold": 13.253250122070312, "eval_allNLI-dev_euclidean_ap": 0.6378114586204184, "eval_allNLI-dev_euclidean_f1": 0.6512702078521939, "eval_allNLI-dev_euclidean_f1_threshold": 17.237594604492188, "eval_allNLI-dev_euclidean_precision": 0.5423076923076923, "eval_allNLI-dev_euclidean_recall": 0.815028901734104, "eval_allNLI-dev_manhattan_accuracy": 0.740234375, "eval_allNLI-dev_manhattan_accuracy_threshold": 267.76416015625, "eval_allNLI-dev_manhattan_ap": 0.6391624752319756, "eval_allNLI-dev_manhattan_f1": 0.6457831325301204, "eval_allNLI-dev_manhattan_f1_threshold": 353.9185791015625, "eval_allNLI-dev_manhattan_precision": 0.5537190082644629, "eval_allNLI-dev_manhattan_recall": 0.7745664739884393, "eval_allNLI-dev_max_accuracy": 0.7421875, "eval_allNLI-dev_max_accuracy_threshold": 283.5550842285156, "eval_allNLI-dev_max_ap": 0.6391624752319756, "eval_allNLI-dev_max_f1": 0.6512702078521939, "eval_allNLI-dev_max_f1_threshold": 353.9185791015625, "eval_allNLI-dev_max_precision": 0.5537190082644629, "eval_allNLI-dev_max_recall": 0.815028901734104, "eval_sequential_score": 0.7325123059741169, "eval_sts-test_pearson_cosine": 0.8848940721874675, "eval_sts-test_pearson_dot": 0.8708637407541432, "eval_sts-test_pearson_euclidean": 0.9044975746549173, "eval_sts-test_pearson_manhattan": 0.905176437582178, "eval_sts-test_pearson_max": 0.905176437582178, "eval_sts-test_spearman_cosine": 0.9077582147291623, "eval_sts-test_spearman_dot": 0.870147285600329, "eval_sts-test_spearman_euclidean": 0.9012842734999755, "eval_sts-test_spearman_manhattan": 0.9020171201565211, "eval_sts-test_spearman_max": 0.9077582147291623, "eval_vitaminc-pairs_loss": 2.790738105773926, "eval_vitaminc-pairs_runtime": 3.8263, "eval_vitaminc-pairs_samples_per_second": 33.453, "eval_vitaminc-pairs_steps_per_second": 0.261, "step": 32 }, { "epoch": 0.3106796116504854, "eval_negation-triplets_loss": 1.3332663774490356, "eval_negation-triplets_runtime": 0.631, "eval_negation-triplets_samples_per_second": 202.843, "eval_negation-triplets_steps_per_second": 1.585, "step": 32 }, { "epoch": 0.3106796116504854, "eval_scitail-pairs-pos_loss": 0.06070985272526741, "eval_scitail-pairs-pos_runtime": 0.8894, "eval_scitail-pairs-pos_samples_per_second": 143.912, "eval_scitail-pairs-pos_steps_per_second": 1.124, "step": 32 }, { "epoch": 0.3106796116504854, "eval_scitail-pairs-qa_loss": 1.3768674023140193e-07, "eval_scitail-pairs-qa_runtime": 0.5735, "eval_scitail-pairs-qa_samples_per_second": 223.193, "eval_scitail-pairs-qa_steps_per_second": 1.744, "step": 32 }, { "epoch": 0.3106796116504854, "eval_xsum-pairs_loss": 0.00016528123524039984, "eval_xsum-pairs_runtime": 2.9269, "eval_xsum-pairs_samples_per_second": 43.733, "eval_xsum-pairs_steps_per_second": 0.342, "step": 32 }, { "epoch": 0.3106796116504854, "eval_sciq_pairs_loss": 0.053717803210020065, "eval_sciq_pairs_runtime": 2.507, "eval_sciq_pairs_samples_per_second": 34.703, "eval_sciq_pairs_steps_per_second": 0.399, "step": 32 }, { "epoch": 0.3106796116504854, "eval_qasc_pairs_loss": 0.0767521858215332, "eval_qasc_pairs_runtime": 0.3716, "eval_qasc_pairs_samples_per_second": 234.106, "eval_qasc_pairs_steps_per_second": 2.691, "step": 32 }, { "epoch": 0.3106796116504854, "eval_openbookqa_pairs_loss": 1.3624300956726074, "eval_openbookqa_pairs_runtime": 0.5694, "eval_openbookqa_pairs_samples_per_second": 224.793, "eval_openbookqa_pairs_steps_per_second": 1.756, "step": 32 }, { "epoch": 0.3106796116504854, "eval_msmarco_pairs_loss": 0.1503019779920578, "eval_msmarco_pairs_runtime": 1.0979, "eval_msmarco_pairs_samples_per_second": 79.242, "eval_msmarco_pairs_steps_per_second": 0.911, "step": 32 }, { "epoch": 0.3106796116504854, "eval_nq_pairs_loss": 0.007631430868059397, "eval_nq_pairs_runtime": 2.2394, "eval_nq_pairs_samples_per_second": 38.849, "eval_nq_pairs_steps_per_second": 0.447, "step": 32 }, { "epoch": 0.3106796116504854, "eval_trivia_pairs_loss": 0.2704613208770752, "eval_trivia_pairs_runtime": 2.4373, "eval_trivia_pairs_samples_per_second": 41.029, "eval_trivia_pairs_steps_per_second": 0.41, "step": 32 }, { "epoch": 0.3106796116504854, "eval_gooaq_pairs_loss": 0.05935850366950035, "eval_gooaq_pairs_runtime": 0.5791, "eval_gooaq_pairs_samples_per_second": 150.232, "eval_gooaq_pairs_steps_per_second": 1.727, "step": 32 }, { "epoch": 0.3106796116504854, "eval_paws-pos_loss": 0.04611051082611084, "eval_paws-pos_runtime": 0.6911, "eval_paws-pos_samples_per_second": 185.199, "eval_paws-pos_steps_per_second": 1.447, "step": 32 }, { "epoch": 0.3106796116504854, "eval_global_dataset_loss": 0.4507196247577667, "eval_global_dataset_runtime": 25.0483, "eval_global_dataset_samples_per_second": 26.469, "eval_global_dataset_steps_per_second": 0.24, "step": 32 } ], "logging_steps": 1, "max_steps": 309, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 16, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 96, "trial_name": null, "trial_params": null }