| { | |
| "best_metric": 0.8362939444102149, | |
| "best_model_checkpoint": "checkpoints/multicse-bert-base-uncased", | |
| "epoch": 6.0, | |
| "global_step": 2706, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.06, | |
| "eval_avg_sts": 0.808172199263909, | |
| "eval_sickr_spearman": 0.783590147828092, | |
| "eval_stsb_spearman": 0.8327542506997261, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 0.11, | |
| "eval_avg_sts": 0.820794223239678, | |
| "eval_sickr_spearman": 0.8053590918084821, | |
| "eval_stsb_spearman": 0.8362293546708739, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "eval_avg_sts": 0.8218985782625993, | |
| "eval_sickr_spearman": 0.8010904717614742, | |
| "eval_stsb_spearman": 0.8427066847637243, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_avg_sts": 0.8212197665999863, | |
| "eval_sickr_spearman": 0.7985843529817378, | |
| "eval_stsb_spearman": 0.8438551802182349, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "eval_avg_sts": 0.8263710498747726, | |
| "eval_sickr_spearman": 0.8055955008897605, | |
| "eval_stsb_spearman": 0.8471465988597847, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.33, | |
| "eval_avg_sts": 0.8263231728376124, | |
| "eval_sickr_spearman": 0.8046682604764976, | |
| "eval_stsb_spearman": 0.8479780851987271, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "eval_avg_sts": 0.8240636839647479, | |
| "eval_sickr_spearman": 0.80153019649514, | |
| "eval_stsb_spearman": 0.8465971714343559, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_avg_sts": 0.8305466429958255, | |
| "eval_sickr_spearman": 0.8140019522945605, | |
| "eval_stsb_spearman": 0.8470913336970906, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "eval_avg_sts": 0.8212438683719858, | |
| "eval_sickr_spearman": 0.796099127731127, | |
| "eval_stsb_spearman": 0.8463886090128445, | |
| "step": 225 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "eval_avg_sts": 0.8290131151517519, | |
| "eval_sickr_spearman": 0.8127541523102997, | |
| "eval_stsb_spearman": 0.8452720779932043, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_avg_sts": 0.8291875600829677, | |
| "eval_sickr_spearman": 0.8103600420591169, | |
| "eval_stsb_spearman": 0.8480150781068185, | |
| "step": 275 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "eval_avg_sts": 0.8327962239942688, | |
| "eval_sickr_spearman": 0.816952310731498, | |
| "eval_stsb_spearman": 0.8486401372570397, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "eval_avg_sts": 0.8330122790068915, | |
| "eval_sickr_spearman": 0.8143033474560845, | |
| "eval_stsb_spearman": 0.8517212105576986, | |
| "step": 325 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "eval_avg_sts": 0.8334940457333329, | |
| "eval_sickr_spearman": 0.8149612294524823, | |
| "eval_stsb_spearman": 0.8520268620141834, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_avg_sts": 0.8359867680300406, | |
| "eval_sickr_spearman": 0.8166730579077367, | |
| "eval_stsb_spearman": 0.8553004781523443, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "eval_avg_sts": 0.8362939444102149, | |
| "eval_sickr_spearman": 0.8178701370488788, | |
| "eval_stsb_spearman": 0.8547177517715511, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_avg_sts": 0.8269789550924258, | |
| "eval_sickr_spearman": 0.8014972471595535, | |
| "eval_stsb_spearman": 0.852460663025298, | |
| "step": 425 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_avg_sts": 0.8271598937884023, | |
| "eval_sickr_spearman": 0.8061173588068856, | |
| "eval_stsb_spearman": 0.8482024287699189, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "eval_avg_sts": 0.8282927205714137, | |
| "eval_sickr_spearman": 0.8104696010014973, | |
| "eval_stsb_spearman": 0.84611584014133, | |
| "step": 475 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "learning_rate": 4.076127124907613e-05, | |
| "loss": 0.4303, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_avg_sts": 0.8274629650840639, | |
| "eval_sickr_spearman": 0.8056994401932726, | |
| "eval_stsb_spearman": 0.8492264899748552, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "eval_avg_sts": 0.8274341455051789, | |
| "eval_sickr_spearman": 0.8072793272128764, | |
| "eval_stsb_spearman": 0.8475889637974814, | |
| "step": 525 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "eval_avg_sts": 0.8269940468993253, | |
| "eval_sickr_spearman": 0.803170506640353, | |
| "eval_stsb_spearman": 0.8508175871582977, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "eval_avg_sts": 0.8288643821143353, | |
| "eval_sickr_spearman": 0.8083313524276753, | |
| "eval_stsb_spearman": 0.8493974118009953, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "eval_avg_sts": 0.8342864948337284, | |
| "eval_sickr_spearman": 0.8138802895146177, | |
| "eval_stsb_spearman": 0.8546927001528392, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_avg_sts": 0.8270151161624402, | |
| "eval_sickr_spearman": 0.8041265176833771, | |
| "eval_stsb_spearman": 0.8499037146415034, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_avg_sts": 0.8279455772988316, | |
| "eval_sickr_spearman": 0.8036888102559718, | |
| "eval_stsb_spearman": 0.8522023443416914, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "eval_avg_sts": 0.829012477308678, | |
| "eval_sickr_spearman": 0.808486444854219, | |
| "eval_stsb_spearman": 0.849538509763137, | |
| "step": 675 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "eval_avg_sts": 0.8288300235840231, | |
| "eval_sickr_spearman": 0.8088525379093803, | |
| "eval_stsb_spearman": 0.848807509258666, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 1.61, | |
| "eval_avg_sts": 0.8305859335486241, | |
| "eval_sickr_spearman": 0.8107295453224803, | |
| "eval_stsb_spearman": 0.8504423217747678, | |
| "step": 725 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_avg_sts": 0.8280931139956361, | |
| "eval_sickr_spearman": 0.8061409420776917, | |
| "eval_stsb_spearman": 0.8500452859135805, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "eval_avg_sts": 0.8302899379899211, | |
| "eval_sickr_spearman": 0.8096262228913453, | |
| "eval_stsb_spearman": 0.850953653088497, | |
| "step": 775 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "eval_avg_sts": 0.8312188464560427, | |
| "eval_sickr_spearman": 0.8104490436900817, | |
| "eval_stsb_spearman": 0.8519886492220037, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_avg_sts": 0.8302662907658385, | |
| "eval_sickr_spearman": 0.8117301772587404, | |
| "eval_stsb_spearman": 0.8488024042729365, | |
| "step": 825 | |
| }, | |
| { | |
| "epoch": 1.88, | |
| "eval_avg_sts": 0.83177529644248, | |
| "eval_sickr_spearman": 0.8116331544338355, | |
| "eval_stsb_spearman": 0.8519174384511247, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "eval_avg_sts": 0.8342887017337668, | |
| "eval_sickr_spearman": 0.8159248294095337, | |
| "eval_stsb_spearman": 0.8526525740579998, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_avg_sts": 0.8335303856286564, | |
| "eval_sickr_spearman": 0.8152034983281362, | |
| "eval_stsb_spearman": 0.8518572729291767, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "eval_avg_sts": 0.8316736063387226, | |
| "eval_sickr_spearman": 0.8125293667555692, | |
| "eval_stsb_spearman": 0.8508178459218759, | |
| "step": 925 | |
| }, | |
| { | |
| "epoch": 2.11, | |
| "eval_avg_sts": 0.8280586113483762, | |
| "eval_sickr_spearman": 0.809915706339713, | |
| "eval_stsb_spearman": 0.8462015163570394, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 2.16, | |
| "eval_avg_sts": 0.8285809844295435, | |
| "eval_sickr_spearman": 0.8105551443931586, | |
| "eval_stsb_spearman": 0.8466068244659284, | |
| "step": 975 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "learning_rate": 3.152254249815226e-05, | |
| "loss": 0.2628, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "eval_avg_sts": 0.8304703081697632, | |
| "eval_sickr_spearman": 0.8108091328575633, | |
| "eval_stsb_spearman": 0.8501314834819631, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "eval_avg_sts": 0.8246676161757887, | |
| "eval_sickr_spearman": 0.8022548417225369, | |
| "eval_stsb_spearman": 0.8470803906290405, | |
| "step": 1025 | |
| }, | |
| { | |
| "epoch": 2.33, | |
| "eval_avg_sts": 0.8247542776319872, | |
| "eval_sickr_spearman": 0.8023693478683652, | |
| "eval_stsb_spearman": 0.8471392073956092, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 2.38, | |
| "eval_avg_sts": 0.8284712817725378, | |
| "eval_sickr_spearman": 0.8063077540929862, | |
| "eval_stsb_spearman": 0.8506348094520895, | |
| "step": 1075 | |
| }, | |
| { | |
| "epoch": 2.44, | |
| "eval_avg_sts": 0.8267581222566869, | |
| "eval_sickr_spearman": 0.8023707888014083, | |
| "eval_stsb_spearman": 0.8511454557119653, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "eval_avg_sts": 0.8245678399799343, | |
| "eval_sickr_spearman": 0.8010677050193924, | |
| "eval_stsb_spearman": 0.8480679749404763, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 2.55, | |
| "eval_avg_sts": 0.8264893834503197, | |
| "eval_sickr_spearman": 0.8047740249618645, | |
| "eval_stsb_spearman": 0.848204741938775, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 2.61, | |
| "eval_avg_sts": 0.8239740308575658, | |
| "eval_sickr_spearman": 0.802257483433116, | |
| "eval_stsb_spearman": 0.8456905782820158, | |
| "step": 1175 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "eval_avg_sts": 0.8252898688219781, | |
| "eval_sickr_spearman": 0.8059969928666816, | |
| "eval_stsb_spearman": 0.8445827447772745, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 2.72, | |
| "eval_avg_sts": 0.8218363555031618, | |
| "eval_sickr_spearman": 0.7991245587796122, | |
| "eval_stsb_spearman": 0.8445481522267114, | |
| "step": 1225 | |
| }, | |
| { | |
| "epoch": 2.77, | |
| "eval_avg_sts": 0.8265232671423588, | |
| "eval_sickr_spearman": 0.8062044391937928, | |
| "eval_stsb_spearman": 0.8468420950909247, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 2.83, | |
| "eval_avg_sts": 0.8286104291951198, | |
| "eval_sickr_spearman": 0.8096378464178936, | |
| "eval_stsb_spearman": 0.8475830119723461, | |
| "step": 1275 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "eval_avg_sts": 0.8314342022111989, | |
| "eval_sickr_spearman": 0.8138266387743112, | |
| "eval_stsb_spearman": 0.8490417656480866, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 2.94, | |
| "eval_avg_sts": 0.8285621943597675, | |
| "eval_sickr_spearman": 0.807191478328346, | |
| "eval_stsb_spearman": 0.849932910391189, | |
| "step": 1325 | |
| }, | |
| { | |
| "epoch": 2.99, | |
| "eval_avg_sts": 0.8284116030199242, | |
| "eval_sickr_spearman": 0.8073644383246247, | |
| "eval_stsb_spearman": 0.8494587677152238, | |
| "step": 1350 | |
| }, | |
| { | |
| "epoch": 3.05, | |
| "eval_avg_sts": 0.8247221665272242, | |
| "eval_sickr_spearman": 0.8022067145588959, | |
| "eval_stsb_spearman": 0.8472376184955523, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 3.1, | |
| "eval_avg_sts": 0.826858184586315, | |
| "eval_sickr_spearman": 0.8056980472913309, | |
| "eval_stsb_spearman": 0.848018321881299, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 3.16, | |
| "eval_avg_sts": 0.8262245909726973, | |
| "eval_sickr_spearman": 0.8059310941955087, | |
| "eval_stsb_spearman": 0.846518087749886, | |
| "step": 1425 | |
| }, | |
| { | |
| "epoch": 3.22, | |
| "eval_avg_sts": 0.8271328383994965, | |
| "eval_sickr_spearman": 0.8059575113012996, | |
| "eval_stsb_spearman": 0.8483081654976934, | |
| "step": 1450 | |
| }, | |
| { | |
| "epoch": 3.27, | |
| "eval_avg_sts": 0.8262273295933256, | |
| "eval_sickr_spearman": 0.8045855028887199, | |
| "eval_stsb_spearman": 0.8478691562979312, | |
| "step": 1475 | |
| }, | |
| { | |
| "epoch": 3.33, | |
| "learning_rate": 2.2283813747228384e-05, | |
| "loss": 0.2284, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 3.33, | |
| "eval_avg_sts": 0.8290942209780299, | |
| "eval_sickr_spearman": 0.8098024490025217, | |
| "eval_stsb_spearman": 0.848385992953538, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 3.38, | |
| "eval_avg_sts": 0.8271287520959363, | |
| "eval_sickr_spearman": 0.8068388820126888, | |
| "eval_stsb_spearman": 0.8474186221791836, | |
| "step": 1525 | |
| }, | |
| { | |
| "epoch": 3.44, | |
| "eval_avg_sts": 0.8284906943060749, | |
| "eval_sickr_spearman": 0.8083666552872324, | |
| "eval_stsb_spearman": 0.8486147333249174, | |
| "step": 1550 | |
| }, | |
| { | |
| "epoch": 3.49, | |
| "eval_avg_sts": 0.8247556311383242, | |
| "eval_sickr_spearman": 0.8033069629995387, | |
| "eval_stsb_spearman": 0.8462042992771095, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 3.55, | |
| "eval_avg_sts": 0.8256788195546352, | |
| "eval_sickr_spearman": 0.8046946295511871, | |
| "eval_stsb_spearman": 0.8466630095580832, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "eval_avg_sts": 0.8246935620550073, | |
| "eval_sickr_spearman": 0.8025401944961806, | |
| "eval_stsb_spearman": 0.8468469296138341, | |
| "step": 1625 | |
| }, | |
| { | |
| "epoch": 3.66, | |
| "eval_avg_sts": 0.8263329601931413, | |
| "eval_sickr_spearman": 0.8045876162571832, | |
| "eval_stsb_spearman": 0.8480783041290992, | |
| "step": 1650 | |
| }, | |
| { | |
| "epoch": 3.71, | |
| "eval_avg_sts": 0.8264865724885355, | |
| "eval_sickr_spearman": 0.8057473272014063, | |
| "eval_stsb_spearman": 0.8472258177756647, | |
| "step": 1675 | |
| }, | |
| { | |
| "epoch": 3.77, | |
| "eval_avg_sts": 0.8254423729673166, | |
| "eval_sickr_spearman": 0.8031947143154778, | |
| "eval_stsb_spearman": 0.8476900316191552, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 3.82, | |
| "eval_avg_sts": 0.8264107919338515, | |
| "eval_sickr_spearman": 0.8053674972512337, | |
| "eval_stsb_spearman": 0.8474540866164694, | |
| "step": 1725 | |
| }, | |
| { | |
| "epoch": 3.88, | |
| "eval_avg_sts": 0.8264776461929313, | |
| "eval_sickr_spearman": 0.8059907968545961, | |
| "eval_stsb_spearman": 0.8469644955312665, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 3.94, | |
| "eval_avg_sts": 0.8240221134684459, | |
| "eval_sickr_spearman": 0.8008853789583333, | |
| "eval_stsb_spearman": 0.8471588479785584, | |
| "step": 1775 | |
| }, | |
| { | |
| "epoch": 3.99, | |
| "eval_avg_sts": 0.8260093129727113, | |
| "eval_sickr_spearman": 0.8032525437616094, | |
| "eval_stsb_spearman": 0.8487660821838133, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 4.05, | |
| "eval_avg_sts": 0.8251871747358858, | |
| "eval_sickr_spearman": 0.8022517677320448, | |
| "eval_stsb_spearman": 0.8481225817397268, | |
| "step": 1825 | |
| }, | |
| { | |
| "epoch": 4.1, | |
| "eval_avg_sts": 0.8236068675958164, | |
| "eval_sickr_spearman": 0.8001952680928707, | |
| "eval_stsb_spearman": 0.8470184670987619, | |
| "step": 1850 | |
| }, | |
| { | |
| "epoch": 4.16, | |
| "eval_avg_sts": 0.8238228114044301, | |
| "eval_sickr_spearman": 0.8002784579605614, | |
| "eval_stsb_spearman": 0.8473671648482989, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 4.21, | |
| "eval_avg_sts": 0.8236955591912043, | |
| "eval_sickr_spearman": 0.7999801848206307, | |
| "eval_stsb_spearman": 0.847410933561778, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 4.27, | |
| "eval_avg_sts": 0.8217179921122288, | |
| "eval_sickr_spearman": 0.7976729628319497, | |
| "eval_stsb_spearman": 0.8457630213925079, | |
| "step": 1925 | |
| }, | |
| { | |
| "epoch": 4.32, | |
| "eval_avg_sts": 0.8218133292332199, | |
| "eval_sickr_spearman": 0.7972407309501078, | |
| "eval_stsb_spearman": 0.8463859275163321, | |
| "step": 1950 | |
| }, | |
| { | |
| "epoch": 4.38, | |
| "eval_avg_sts": 0.82307986157595, | |
| "eval_sickr_spearman": 0.7997425269307149, | |
| "eval_stsb_spearman": 0.846417196221185, | |
| "step": 1975 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "learning_rate": 1.3045084996304511e-05, | |
| "loss": 0.2149, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "eval_avg_sts": 0.8251845211566629, | |
| "eval_sickr_spearman": 0.803791356657542, | |
| "eval_stsb_spearman": 0.8465776856557838, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 4.49, | |
| "eval_avg_sts": 0.8244897261222982, | |
| "eval_sickr_spearman": 0.8012433547573516, | |
| "eval_stsb_spearman": 0.8477360974872448, | |
| "step": 2025 | |
| }, | |
| { | |
| "epoch": 4.55, | |
| "eval_avg_sts": 0.8248464356555265, | |
| "eval_sickr_spearman": 0.80196872045127, | |
| "eval_stsb_spearman": 0.847724150859783, | |
| "step": 2050 | |
| }, | |
| { | |
| "epoch": 4.6, | |
| "eval_avg_sts": 0.8236282342217962, | |
| "eval_sickr_spearman": 0.801061412945104, | |
| "eval_stsb_spearman": 0.8461950554984884, | |
| "step": 2075 | |
| }, | |
| { | |
| "epoch": 4.66, | |
| "eval_avg_sts": 0.8241232806486489, | |
| "eval_sickr_spearman": 0.8016284200975811, | |
| "eval_stsb_spearman": 0.8466181411997169, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 4.71, | |
| "eval_avg_sts": 0.8240448338930326, | |
| "eval_sickr_spearman": 0.8024957657273504, | |
| "eval_stsb_spearman": 0.845593902058715, | |
| "step": 2125 | |
| }, | |
| { | |
| "epoch": 4.77, | |
| "eval_avg_sts": 0.8252602189328375, | |
| "eval_sickr_spearman": 0.8031946662843764, | |
| "eval_stsb_spearman": 0.8473257715812985, | |
| "step": 2150 | |
| }, | |
| { | |
| "epoch": 4.82, | |
| "eval_avg_sts": 0.8237954063381605, | |
| "eval_sickr_spearman": 0.8006036285172974, | |
| "eval_stsb_spearman": 0.8469871841590237, | |
| "step": 2175 | |
| }, | |
| { | |
| "epoch": 4.88, | |
| "eval_avg_sts": 0.8238382480785117, | |
| "eval_sickr_spearman": 0.8008013245308166, | |
| "eval_stsb_spearman": 0.8468751716262067, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 4.93, | |
| "eval_avg_sts": 0.8226554353280054, | |
| "eval_sickr_spearman": 0.79934425303759, | |
| "eval_stsb_spearman": 0.8459666176184208, | |
| "step": 2225 | |
| }, | |
| { | |
| "epoch": 4.99, | |
| "eval_avg_sts": 0.8221324924350076, | |
| "eval_sickr_spearman": 0.7977314166823997, | |
| "eval_stsb_spearman": 0.8465335681876156, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 5.04, | |
| "eval_avg_sts": 0.8230411082185226, | |
| "eval_sickr_spearman": 0.7989547688360285, | |
| "eval_stsb_spearman": 0.8471274476010168, | |
| "step": 2275 | |
| }, | |
| { | |
| "epoch": 5.1, | |
| "eval_avg_sts": 0.8228022688627314, | |
| "eval_sickr_spearman": 0.7994119768906178, | |
| "eval_stsb_spearman": 0.846192560834845, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 5.16, | |
| "eval_avg_sts": 0.8228479899857558, | |
| "eval_sickr_spearman": 0.7989381981060323, | |
| "eval_stsb_spearman": 0.8467577818654793, | |
| "step": 2325 | |
| }, | |
| { | |
| "epoch": 5.21, | |
| "eval_avg_sts": 0.8221050116430979, | |
| "eval_sickr_spearman": 0.7985421816746751, | |
| "eval_stsb_spearman": 0.8456678416115206, | |
| "step": 2350 | |
| }, | |
| { | |
| "epoch": 5.27, | |
| "eval_avg_sts": 0.822383318476755, | |
| "eval_sickr_spearman": 0.7986474658490273, | |
| "eval_stsb_spearman": 0.8461191711044828, | |
| "step": 2375 | |
| }, | |
| { | |
| "epoch": 5.32, | |
| "eval_avg_sts": 0.823048712126393, | |
| "eval_sickr_spearman": 0.7993529466669504, | |
| "eval_stsb_spearman": 0.8467444775858354, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 5.38, | |
| "eval_avg_sts": 0.8228378854074433, | |
| "eval_sickr_spearman": 0.799309382457946, | |
| "eval_stsb_spearman": 0.8463663883569406, | |
| "step": 2425 | |
| }, | |
| { | |
| "epoch": 5.43, | |
| "eval_avg_sts": 0.8229990938054758, | |
| "eval_sickr_spearman": 0.7993526104492402, | |
| "eval_stsb_spearman": 0.8466455771617113, | |
| "step": 2450 | |
| }, | |
| { | |
| "epoch": 5.49, | |
| "eval_avg_sts": 0.8223080164546823, | |
| "eval_sickr_spearman": 0.7985109614587403, | |
| "eval_stsb_spearman": 0.8461050714506243, | |
| "step": 2475 | |
| }, | |
| { | |
| "epoch": 5.54, | |
| "learning_rate": 3.806356245380636e-06, | |
| "loss": 0.2074, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 5.54, | |
| "eval_avg_sts": 0.8224706658462584, | |
| "eval_sickr_spearman": 0.7986079842836452, | |
| "eval_stsb_spearman": 0.8463333474088716, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 5.6, | |
| "eval_avg_sts": 0.8228255546038069, | |
| "eval_sickr_spearman": 0.7993520821071245, | |
| "eval_stsb_spearman": 0.8462990271004893, | |
| "step": 2525 | |
| }, | |
| { | |
| "epoch": 5.65, | |
| "eval_avg_sts": 0.8222772197799051, | |
| "eval_sickr_spearman": 0.7986904536848144, | |
| "eval_stsb_spearman": 0.8458639858749959, | |
| "step": 2550 | |
| }, | |
| { | |
| "epoch": 5.71, | |
| "eval_avg_sts": 0.822395438556291, | |
| "eval_sickr_spearman": 0.7987432398652949, | |
| "eval_stsb_spearman": 0.8460476372472872, | |
| "step": 2575 | |
| }, | |
| { | |
| "epoch": 5.76, | |
| "eval_avg_sts": 0.8229151972681052, | |
| "eval_sickr_spearman": 0.7992985754601224, | |
| "eval_stsb_spearman": 0.8465318190760882, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 5.82, | |
| "eval_avg_sts": 0.8227679691163096, | |
| "eval_sickr_spearman": 0.7989778237647187, | |
| "eval_stsb_spearman": 0.8465581144679004, | |
| "step": 2625 | |
| }, | |
| { | |
| "epoch": 5.88, | |
| "eval_avg_sts": 0.8231044151175362, | |
| "eval_sickr_spearman": 0.7993373845900845, | |
| "eval_stsb_spearman": 0.8468714456449877, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 5.93, | |
| "eval_avg_sts": 0.8230968701740264, | |
| "eval_sickr_spearman": 0.7993484797745166, | |
| "eval_stsb_spearman": 0.8468452605735363, | |
| "step": 2675 | |
| }, | |
| { | |
| "epoch": 5.99, | |
| "eval_avg_sts": 0.8230334553806065, | |
| "eval_sickr_spearman": 0.7992910345771966, | |
| "eval_stsb_spearman": 0.8467758761840164, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "step": 2706, | |
| "train_runtime": 3739.6542, | |
| "train_samples_per_second": 0.724 | |
| } | |
| ], | |
| "max_steps": 2706, | |
| "num_train_epochs": 6, | |
| "total_flos": 212939896792195584, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |