{ "best_metric": 0.8362939444102149, "best_model_checkpoint": "checkpoints/multicse-bert-base-uncased", "epoch": 6.0, "global_step": 2706, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "eval_avg_sts": 0.808172199263909, "eval_sickr_spearman": 0.783590147828092, "eval_stsb_spearman": 0.8327542506997261, "step": 25 }, { "epoch": 0.11, "eval_avg_sts": 0.820794223239678, "eval_sickr_spearman": 0.8053590918084821, "eval_stsb_spearman": 0.8362293546708739, "step": 50 }, { "epoch": 0.17, "eval_avg_sts": 0.8218985782625993, "eval_sickr_spearman": 0.8010904717614742, "eval_stsb_spearman": 0.8427066847637243, "step": 75 }, { "epoch": 0.22, "eval_avg_sts": 0.8212197665999863, "eval_sickr_spearman": 0.7985843529817378, "eval_stsb_spearman": 0.8438551802182349, "step": 100 }, { "epoch": 0.28, "eval_avg_sts": 0.8263710498747726, "eval_sickr_spearman": 0.8055955008897605, "eval_stsb_spearman": 0.8471465988597847, "step": 125 }, { "epoch": 0.33, "eval_avg_sts": 0.8263231728376124, "eval_sickr_spearman": 0.8046682604764976, "eval_stsb_spearman": 0.8479780851987271, "step": 150 }, { "epoch": 0.39, "eval_avg_sts": 0.8240636839647479, "eval_sickr_spearman": 0.80153019649514, "eval_stsb_spearman": 0.8465971714343559, "step": 175 }, { "epoch": 0.44, "eval_avg_sts": 0.8305466429958255, "eval_sickr_spearman": 0.8140019522945605, "eval_stsb_spearman": 0.8470913336970906, "step": 200 }, { "epoch": 0.5, "eval_avg_sts": 0.8212438683719858, "eval_sickr_spearman": 0.796099127731127, "eval_stsb_spearman": 0.8463886090128445, "step": 225 }, { "epoch": 0.55, "eval_avg_sts": 0.8290131151517519, "eval_sickr_spearman": 0.8127541523102997, "eval_stsb_spearman": 0.8452720779932043, "step": 250 }, { "epoch": 0.61, "eval_avg_sts": 0.8291875600829677, "eval_sickr_spearman": 0.8103600420591169, "eval_stsb_spearman": 0.8480150781068185, "step": 275 }, { "epoch": 0.67, "eval_avg_sts": 0.8327962239942688, "eval_sickr_spearman": 0.816952310731498, "eval_stsb_spearman": 0.8486401372570397, "step": 300 }, { "epoch": 0.72, "eval_avg_sts": 0.8330122790068915, "eval_sickr_spearman": 0.8143033474560845, "eval_stsb_spearman": 0.8517212105576986, "step": 325 }, { "epoch": 0.78, "eval_avg_sts": 0.8334940457333329, "eval_sickr_spearman": 0.8149612294524823, "eval_stsb_spearman": 0.8520268620141834, "step": 350 }, { "epoch": 0.83, "eval_avg_sts": 0.8359867680300406, "eval_sickr_spearman": 0.8166730579077367, "eval_stsb_spearman": 0.8553004781523443, "step": 375 }, { "epoch": 0.89, "eval_avg_sts": 0.8362939444102149, "eval_sickr_spearman": 0.8178701370488788, "eval_stsb_spearman": 0.8547177517715511, "step": 400 }, { "epoch": 0.94, "eval_avg_sts": 0.8269789550924258, "eval_sickr_spearman": 0.8014972471595535, "eval_stsb_spearman": 0.852460663025298, "step": 425 }, { "epoch": 1.0, "eval_avg_sts": 0.8271598937884023, "eval_sickr_spearman": 0.8061173588068856, "eval_stsb_spearman": 0.8482024287699189, "step": 450 }, { "epoch": 1.05, "eval_avg_sts": 0.8282927205714137, "eval_sickr_spearman": 0.8104696010014973, "eval_stsb_spearman": 0.84611584014133, "step": 475 }, { "epoch": 1.11, "learning_rate": 4.076127124907613e-05, "loss": 0.4303, "step": 500 }, { "epoch": 1.11, "eval_avg_sts": 0.8274629650840639, "eval_sickr_spearman": 0.8056994401932726, "eval_stsb_spearman": 0.8492264899748552, "step": 500 }, { "epoch": 1.16, "eval_avg_sts": 0.8274341455051789, "eval_sickr_spearman": 0.8072793272128764, "eval_stsb_spearman": 0.8475889637974814, "step": 525 }, { "epoch": 1.22, "eval_avg_sts": 0.8269940468993253, "eval_sickr_spearman": 0.803170506640353, "eval_stsb_spearman": 0.8508175871582977, "step": 550 }, { "epoch": 1.27, "eval_avg_sts": 0.8288643821143353, "eval_sickr_spearman": 0.8083313524276753, "eval_stsb_spearman": 0.8493974118009953, "step": 575 }, { "epoch": 1.33, "eval_avg_sts": 0.8342864948337284, "eval_sickr_spearman": 0.8138802895146177, "eval_stsb_spearman": 0.8546927001528392, "step": 600 }, { "epoch": 1.39, "eval_avg_sts": 0.8270151161624402, "eval_sickr_spearman": 0.8041265176833771, "eval_stsb_spearman": 0.8499037146415034, "step": 625 }, { "epoch": 1.44, "eval_avg_sts": 0.8279455772988316, "eval_sickr_spearman": 0.8036888102559718, "eval_stsb_spearman": 0.8522023443416914, "step": 650 }, { "epoch": 1.5, "eval_avg_sts": 0.829012477308678, "eval_sickr_spearman": 0.808486444854219, "eval_stsb_spearman": 0.849538509763137, "step": 675 }, { "epoch": 1.55, "eval_avg_sts": 0.8288300235840231, "eval_sickr_spearman": 0.8088525379093803, "eval_stsb_spearman": 0.848807509258666, "step": 700 }, { "epoch": 1.61, "eval_avg_sts": 0.8305859335486241, "eval_sickr_spearman": 0.8107295453224803, "eval_stsb_spearman": 0.8504423217747678, "step": 725 }, { "epoch": 1.66, "eval_avg_sts": 0.8280931139956361, "eval_sickr_spearman": 0.8061409420776917, "eval_stsb_spearman": 0.8500452859135805, "step": 750 }, { "epoch": 1.72, "eval_avg_sts": 0.8302899379899211, "eval_sickr_spearman": 0.8096262228913453, "eval_stsb_spearman": 0.850953653088497, "step": 775 }, { "epoch": 1.77, "eval_avg_sts": 0.8312188464560427, "eval_sickr_spearman": 0.8104490436900817, "eval_stsb_spearman": 0.8519886492220037, "step": 800 }, { "epoch": 1.83, "eval_avg_sts": 0.8302662907658385, "eval_sickr_spearman": 0.8117301772587404, "eval_stsb_spearman": 0.8488024042729365, "step": 825 }, { "epoch": 1.88, "eval_avg_sts": 0.83177529644248, "eval_sickr_spearman": 0.8116331544338355, "eval_stsb_spearman": 0.8519174384511247, "step": 850 }, { "epoch": 1.94, "eval_avg_sts": 0.8342887017337668, "eval_sickr_spearman": 0.8159248294095337, "eval_stsb_spearman": 0.8526525740579998, "step": 875 }, { "epoch": 2.0, "eval_avg_sts": 0.8335303856286564, "eval_sickr_spearman": 0.8152034983281362, "eval_stsb_spearman": 0.8518572729291767, "step": 900 }, { "epoch": 2.05, "eval_avg_sts": 0.8316736063387226, "eval_sickr_spearman": 0.8125293667555692, "eval_stsb_spearman": 0.8508178459218759, "step": 925 }, { "epoch": 2.11, "eval_avg_sts": 0.8280586113483762, "eval_sickr_spearman": 0.809915706339713, "eval_stsb_spearman": 0.8462015163570394, "step": 950 }, { "epoch": 2.16, "eval_avg_sts": 0.8285809844295435, "eval_sickr_spearman": 0.8105551443931586, "eval_stsb_spearman": 0.8466068244659284, "step": 975 }, { "epoch": 2.22, "learning_rate": 3.152254249815226e-05, "loss": 0.2628, "step": 1000 }, { "epoch": 2.22, "eval_avg_sts": 0.8304703081697632, "eval_sickr_spearman": 0.8108091328575633, "eval_stsb_spearman": 0.8501314834819631, "step": 1000 }, { "epoch": 2.27, "eval_avg_sts": 0.8246676161757887, "eval_sickr_spearman": 0.8022548417225369, "eval_stsb_spearman": 0.8470803906290405, "step": 1025 }, { "epoch": 2.33, "eval_avg_sts": 0.8247542776319872, "eval_sickr_spearman": 0.8023693478683652, "eval_stsb_spearman": 0.8471392073956092, "step": 1050 }, { "epoch": 2.38, "eval_avg_sts": 0.8284712817725378, "eval_sickr_spearman": 0.8063077540929862, "eval_stsb_spearman": 0.8506348094520895, "step": 1075 }, { "epoch": 2.44, "eval_avg_sts": 0.8267581222566869, "eval_sickr_spearman": 0.8023707888014083, "eval_stsb_spearman": 0.8511454557119653, "step": 1100 }, { "epoch": 2.49, "eval_avg_sts": 0.8245678399799343, "eval_sickr_spearman": 0.8010677050193924, "eval_stsb_spearman": 0.8480679749404763, "step": 1125 }, { "epoch": 2.55, "eval_avg_sts": 0.8264893834503197, "eval_sickr_spearman": 0.8047740249618645, "eval_stsb_spearman": 0.848204741938775, "step": 1150 }, { "epoch": 2.61, "eval_avg_sts": 0.8239740308575658, "eval_sickr_spearman": 0.802257483433116, "eval_stsb_spearman": 0.8456905782820158, "step": 1175 }, { "epoch": 2.66, "eval_avg_sts": 0.8252898688219781, "eval_sickr_spearman": 0.8059969928666816, "eval_stsb_spearman": 0.8445827447772745, "step": 1200 }, { "epoch": 2.72, "eval_avg_sts": 0.8218363555031618, "eval_sickr_spearman": 0.7991245587796122, "eval_stsb_spearman": 0.8445481522267114, "step": 1225 }, { "epoch": 2.77, "eval_avg_sts": 0.8265232671423588, "eval_sickr_spearman": 0.8062044391937928, "eval_stsb_spearman": 0.8468420950909247, "step": 1250 }, { "epoch": 2.83, "eval_avg_sts": 0.8286104291951198, "eval_sickr_spearman": 0.8096378464178936, "eval_stsb_spearman": 0.8475830119723461, "step": 1275 }, { "epoch": 2.88, "eval_avg_sts": 0.8314342022111989, "eval_sickr_spearman": 0.8138266387743112, "eval_stsb_spearman": 0.8490417656480866, "step": 1300 }, { "epoch": 2.94, "eval_avg_sts": 0.8285621943597675, "eval_sickr_spearman": 0.807191478328346, "eval_stsb_spearman": 0.849932910391189, "step": 1325 }, { "epoch": 2.99, "eval_avg_sts": 0.8284116030199242, "eval_sickr_spearman": 0.8073644383246247, "eval_stsb_spearman": 0.8494587677152238, "step": 1350 }, { "epoch": 3.05, "eval_avg_sts": 0.8247221665272242, "eval_sickr_spearman": 0.8022067145588959, "eval_stsb_spearman": 0.8472376184955523, "step": 1375 }, { "epoch": 3.1, "eval_avg_sts": 0.826858184586315, "eval_sickr_spearman": 0.8056980472913309, "eval_stsb_spearman": 0.848018321881299, "step": 1400 }, { "epoch": 3.16, "eval_avg_sts": 0.8262245909726973, "eval_sickr_spearman": 0.8059310941955087, "eval_stsb_spearman": 0.846518087749886, "step": 1425 }, { "epoch": 3.22, "eval_avg_sts": 0.8271328383994965, "eval_sickr_spearman": 0.8059575113012996, "eval_stsb_spearman": 0.8483081654976934, "step": 1450 }, { "epoch": 3.27, "eval_avg_sts": 0.8262273295933256, "eval_sickr_spearman": 0.8045855028887199, "eval_stsb_spearman": 0.8478691562979312, "step": 1475 }, { "epoch": 3.33, "learning_rate": 2.2283813747228384e-05, "loss": 0.2284, "step": 1500 }, { "epoch": 3.33, "eval_avg_sts": 0.8290942209780299, "eval_sickr_spearman": 0.8098024490025217, "eval_stsb_spearman": 0.848385992953538, "step": 1500 }, { "epoch": 3.38, "eval_avg_sts": 0.8271287520959363, "eval_sickr_spearman": 0.8068388820126888, "eval_stsb_spearman": 0.8474186221791836, "step": 1525 }, { "epoch": 3.44, "eval_avg_sts": 0.8284906943060749, "eval_sickr_spearman": 0.8083666552872324, "eval_stsb_spearman": 0.8486147333249174, "step": 1550 }, { "epoch": 3.49, "eval_avg_sts": 0.8247556311383242, "eval_sickr_spearman": 0.8033069629995387, "eval_stsb_spearman": 0.8462042992771095, "step": 1575 }, { "epoch": 3.55, "eval_avg_sts": 0.8256788195546352, "eval_sickr_spearman": 0.8046946295511871, "eval_stsb_spearman": 0.8466630095580832, "step": 1600 }, { "epoch": 3.6, "eval_avg_sts": 0.8246935620550073, "eval_sickr_spearman": 0.8025401944961806, "eval_stsb_spearman": 0.8468469296138341, "step": 1625 }, { "epoch": 3.66, "eval_avg_sts": 0.8263329601931413, "eval_sickr_spearman": 0.8045876162571832, "eval_stsb_spearman": 0.8480783041290992, "step": 1650 }, { "epoch": 3.71, "eval_avg_sts": 0.8264865724885355, "eval_sickr_spearman": 0.8057473272014063, "eval_stsb_spearman": 0.8472258177756647, "step": 1675 }, { "epoch": 3.77, "eval_avg_sts": 0.8254423729673166, "eval_sickr_spearman": 0.8031947143154778, "eval_stsb_spearman": 0.8476900316191552, "step": 1700 }, { "epoch": 3.82, "eval_avg_sts": 0.8264107919338515, "eval_sickr_spearman": 0.8053674972512337, "eval_stsb_spearman": 0.8474540866164694, "step": 1725 }, { "epoch": 3.88, "eval_avg_sts": 0.8264776461929313, "eval_sickr_spearman": 0.8059907968545961, "eval_stsb_spearman": 0.8469644955312665, "step": 1750 }, { "epoch": 3.94, "eval_avg_sts": 0.8240221134684459, "eval_sickr_spearman": 0.8008853789583333, "eval_stsb_spearman": 0.8471588479785584, "step": 1775 }, { "epoch": 3.99, "eval_avg_sts": 0.8260093129727113, "eval_sickr_spearman": 0.8032525437616094, "eval_stsb_spearman": 0.8487660821838133, "step": 1800 }, { "epoch": 4.05, "eval_avg_sts": 0.8251871747358858, "eval_sickr_spearman": 0.8022517677320448, "eval_stsb_spearman": 0.8481225817397268, "step": 1825 }, { "epoch": 4.1, "eval_avg_sts": 0.8236068675958164, "eval_sickr_spearman": 0.8001952680928707, "eval_stsb_spearman": 0.8470184670987619, "step": 1850 }, { "epoch": 4.16, "eval_avg_sts": 0.8238228114044301, "eval_sickr_spearman": 0.8002784579605614, "eval_stsb_spearman": 0.8473671648482989, "step": 1875 }, { "epoch": 4.21, "eval_avg_sts": 0.8236955591912043, "eval_sickr_spearman": 0.7999801848206307, "eval_stsb_spearman": 0.847410933561778, "step": 1900 }, { "epoch": 4.27, "eval_avg_sts": 0.8217179921122288, "eval_sickr_spearman": 0.7976729628319497, "eval_stsb_spearman": 0.8457630213925079, "step": 1925 }, { "epoch": 4.32, "eval_avg_sts": 0.8218133292332199, "eval_sickr_spearman": 0.7972407309501078, "eval_stsb_spearman": 0.8463859275163321, "step": 1950 }, { "epoch": 4.38, "eval_avg_sts": 0.82307986157595, "eval_sickr_spearman": 0.7997425269307149, "eval_stsb_spearman": 0.846417196221185, "step": 1975 }, { "epoch": 4.43, "learning_rate": 1.3045084996304511e-05, "loss": 0.2149, "step": 2000 }, { "epoch": 4.43, "eval_avg_sts": 0.8251845211566629, "eval_sickr_spearman": 0.803791356657542, "eval_stsb_spearman": 0.8465776856557838, "step": 2000 }, { "epoch": 4.49, "eval_avg_sts": 0.8244897261222982, "eval_sickr_spearman": 0.8012433547573516, "eval_stsb_spearman": 0.8477360974872448, "step": 2025 }, { "epoch": 4.55, "eval_avg_sts": 0.8248464356555265, "eval_sickr_spearman": 0.80196872045127, "eval_stsb_spearman": 0.847724150859783, "step": 2050 }, { "epoch": 4.6, "eval_avg_sts": 0.8236282342217962, "eval_sickr_spearman": 0.801061412945104, "eval_stsb_spearman": 0.8461950554984884, "step": 2075 }, { "epoch": 4.66, "eval_avg_sts": 0.8241232806486489, "eval_sickr_spearman": 0.8016284200975811, "eval_stsb_spearman": 0.8466181411997169, "step": 2100 }, { "epoch": 4.71, "eval_avg_sts": 0.8240448338930326, "eval_sickr_spearman": 0.8024957657273504, "eval_stsb_spearman": 0.845593902058715, "step": 2125 }, { "epoch": 4.77, "eval_avg_sts": 0.8252602189328375, "eval_sickr_spearman": 0.8031946662843764, "eval_stsb_spearman": 0.8473257715812985, "step": 2150 }, { "epoch": 4.82, "eval_avg_sts": 0.8237954063381605, "eval_sickr_spearman": 0.8006036285172974, "eval_stsb_spearman": 0.8469871841590237, "step": 2175 }, { "epoch": 4.88, "eval_avg_sts": 0.8238382480785117, "eval_sickr_spearman": 0.8008013245308166, "eval_stsb_spearman": 0.8468751716262067, "step": 2200 }, { "epoch": 4.93, "eval_avg_sts": 0.8226554353280054, "eval_sickr_spearman": 0.79934425303759, "eval_stsb_spearman": 0.8459666176184208, "step": 2225 }, { "epoch": 4.99, "eval_avg_sts": 0.8221324924350076, "eval_sickr_spearman": 0.7977314166823997, "eval_stsb_spearman": 0.8465335681876156, "step": 2250 }, { "epoch": 5.04, "eval_avg_sts": 0.8230411082185226, "eval_sickr_spearman": 0.7989547688360285, "eval_stsb_spearman": 0.8471274476010168, "step": 2275 }, { "epoch": 5.1, "eval_avg_sts": 0.8228022688627314, "eval_sickr_spearman": 0.7994119768906178, "eval_stsb_spearman": 0.846192560834845, "step": 2300 }, { "epoch": 5.16, "eval_avg_sts": 0.8228479899857558, "eval_sickr_spearman": 0.7989381981060323, "eval_stsb_spearman": 0.8467577818654793, "step": 2325 }, { "epoch": 5.21, "eval_avg_sts": 0.8221050116430979, "eval_sickr_spearman": 0.7985421816746751, "eval_stsb_spearman": 0.8456678416115206, "step": 2350 }, { "epoch": 5.27, "eval_avg_sts": 0.822383318476755, "eval_sickr_spearman": 0.7986474658490273, "eval_stsb_spearman": 0.8461191711044828, "step": 2375 }, { "epoch": 5.32, "eval_avg_sts": 0.823048712126393, "eval_sickr_spearman": 0.7993529466669504, "eval_stsb_spearman": 0.8467444775858354, "step": 2400 }, { "epoch": 5.38, "eval_avg_sts": 0.8228378854074433, "eval_sickr_spearman": 0.799309382457946, "eval_stsb_spearman": 0.8463663883569406, "step": 2425 }, { "epoch": 5.43, "eval_avg_sts": 0.8229990938054758, "eval_sickr_spearman": 0.7993526104492402, "eval_stsb_spearman": 0.8466455771617113, "step": 2450 }, { "epoch": 5.49, "eval_avg_sts": 0.8223080164546823, "eval_sickr_spearman": 0.7985109614587403, "eval_stsb_spearman": 0.8461050714506243, "step": 2475 }, { "epoch": 5.54, "learning_rate": 3.806356245380636e-06, "loss": 0.2074, "step": 2500 }, { "epoch": 5.54, "eval_avg_sts": 0.8224706658462584, "eval_sickr_spearman": 0.7986079842836452, "eval_stsb_spearman": 0.8463333474088716, "step": 2500 }, { "epoch": 5.6, "eval_avg_sts": 0.8228255546038069, "eval_sickr_spearman": 0.7993520821071245, "eval_stsb_spearman": 0.8462990271004893, "step": 2525 }, { "epoch": 5.65, "eval_avg_sts": 0.8222772197799051, "eval_sickr_spearman": 0.7986904536848144, "eval_stsb_spearman": 0.8458639858749959, "step": 2550 }, { "epoch": 5.71, "eval_avg_sts": 0.822395438556291, "eval_sickr_spearman": 0.7987432398652949, "eval_stsb_spearman": 0.8460476372472872, "step": 2575 }, { "epoch": 5.76, "eval_avg_sts": 0.8229151972681052, "eval_sickr_spearman": 0.7992985754601224, "eval_stsb_spearman": 0.8465318190760882, "step": 2600 }, { "epoch": 5.82, "eval_avg_sts": 0.8227679691163096, "eval_sickr_spearman": 0.7989778237647187, "eval_stsb_spearman": 0.8465581144679004, "step": 2625 }, { "epoch": 5.88, "eval_avg_sts": 0.8231044151175362, "eval_sickr_spearman": 0.7993373845900845, "eval_stsb_spearman": 0.8468714456449877, "step": 2650 }, { "epoch": 5.93, "eval_avg_sts": 0.8230968701740264, "eval_sickr_spearman": 0.7993484797745166, "eval_stsb_spearman": 0.8468452605735363, "step": 2675 }, { "epoch": 5.99, "eval_avg_sts": 0.8230334553806065, "eval_sickr_spearman": 0.7992910345771966, "eval_stsb_spearman": 0.8467758761840164, "step": 2700 }, { "epoch": 6.0, "step": 2706, "train_runtime": 3739.6542, "train_samples_per_second": 0.724 } ], "max_steps": 2706, "num_train_epochs": 6, "total_flos": 212939896792195584, "trial_name": null, "trial_params": null }