| { | |
| "best_metric": 0.8287429760185343, | |
| "best_model_checkpoint": "result/my-sup-simcse-roberta-base_filtered_final_augx_0517_275578", | |
| "epoch": 3.0, | |
| "global_step": 1617, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.05, | |
| "eval_avg_sts": 0.7923727821060924, | |
| "eval_sickr_spearman": 0.7589401062590382, | |
| "eval_stsb_spearman": 0.8258054579531467, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 0.09, | |
| "eval_avg_sts": 0.788369556206714, | |
| "eval_sickr_spearman": 0.7429059316970545, | |
| "eval_stsb_spearman": 0.8338331807163735, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_avg_sts": 0.8104646483652821, | |
| "eval_sickr_spearman": 0.7750206308339096, | |
| "eval_stsb_spearman": 0.8459086658966546, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "eval_avg_sts": 0.8156440464261943, | |
| "eval_sickr_spearman": 0.7790718621158088, | |
| "eval_stsb_spearman": 0.8522162307365796, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.23, | |
| "eval_avg_sts": 0.8158874725367419, | |
| "eval_sickr_spearman": 0.7767967729339896, | |
| "eval_stsb_spearman": 0.8549781721394941, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "eval_avg_sts": 0.8226456308827159, | |
| "eval_sickr_spearman": 0.7900410609689407, | |
| "eval_stsb_spearman": 0.8552502007964913, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "eval_avg_sts": 0.8233733407465815, | |
| "eval_sickr_spearman": 0.7881731314340124, | |
| "eval_stsb_spearman": 0.8585735500591508, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "eval_avg_sts": 0.8246758200303745, | |
| "eval_sickr_spearman": 0.7910648919271954, | |
| "eval_stsb_spearman": 0.8582867481335537, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "eval_avg_sts": 0.8127837390967988, | |
| "eval_sickr_spearman": 0.7683723098661505, | |
| "eval_stsb_spearman": 0.8571951683274471, | |
| "step": 225 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "eval_avg_sts": 0.8211001358940954, | |
| "eval_sickr_spearman": 0.7857309900813916, | |
| "eval_stsb_spearman": 0.8564692817067991, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "eval_avg_sts": 0.8231415754884768, | |
| "eval_sickr_spearman": 0.7870932481803794, | |
| "eval_stsb_spearman": 0.859189902796574, | |
| "step": 275 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "eval_avg_sts": 0.8281698148839484, | |
| "eval_sickr_spearman": 0.7933201442641206, | |
| "eval_stsb_spearman": 0.8630194855037762, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.6, | |
| "eval_avg_sts": 0.8261624892170372, | |
| "eval_sickr_spearman": 0.7934045829404487, | |
| "eval_stsb_spearman": 0.8589203954936255, | |
| "step": 325 | |
| }, | |
| { | |
| "epoch": 0.65, | |
| "eval_avg_sts": 0.8223223884475288, | |
| "eval_sickr_spearman": 0.7860610117793729, | |
| "eval_stsb_spearman": 0.8585837651156847, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_avg_sts": 0.8239117966986287, | |
| "eval_sickr_spearman": 0.7878053572903008, | |
| "eval_stsb_spearman": 0.8600182361069565, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_avg_sts": 0.8189825828946973, | |
| "eval_sickr_spearman": 0.7824180448596978, | |
| "eval_stsb_spearman": 0.8555471209296966, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "eval_avg_sts": 0.8284554395260346, | |
| "eval_sickr_spearman": 0.7938278330063215, | |
| "eval_stsb_spearman": 0.8630830460457476, | |
| "step": 425 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_avg_sts": 0.8287429760185343, | |
| "eval_sickr_spearman": 0.7950705897249312, | |
| "eval_stsb_spearman": 0.8624153623121376, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_avg_sts": 0.8175086199936331, | |
| "eval_sickr_spearman": 0.7783943353989228, | |
| "eval_stsb_spearman": 0.8566229045883434, | |
| "step": 475 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 3.453927025355597e-05, | |
| "loss": 0.4533, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "eval_avg_sts": 0.8230793846551405, | |
| "eval_sickr_spearman": 0.791305047434386, | |
| "eval_stsb_spearman": 0.8548537218758949, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_avg_sts": 0.813507998872834, | |
| "eval_sickr_spearman": 0.7710531177618173, | |
| "eval_stsb_spearman": 0.8559628799838506, | |
| "step": 525 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_avg_sts": 0.8152806946649198, | |
| "eval_sickr_spearman": 0.7748347024402428, | |
| "eval_stsb_spearman": 0.8557266868895969, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "eval_avg_sts": 0.8193593042077025, | |
| "eval_sickr_spearman": 0.7769575330305031, | |
| "eval_stsb_spearman": 0.8617610753849019, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_avg_sts": 0.8122703001838674, | |
| "eval_sickr_spearman": 0.7715038416177126, | |
| "eval_stsb_spearman": 0.8530367587500223, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "eval_avg_sts": 0.8236420464403356, | |
| "eval_sickr_spearman": 0.7849814167123483, | |
| "eval_stsb_spearman": 0.8623026761683228, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "eval_avg_sts": 0.8133106230456628, | |
| "eval_sickr_spearman": 0.770097202780996, | |
| "eval_stsb_spearman": 0.8565240433103297, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "eval_avg_sts": 0.8207134638537716, | |
| "eval_sickr_spearman": 0.7790919391162099, | |
| "eval_stsb_spearman": 0.8623349885913333, | |
| "step": 675 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "eval_avg_sts": 0.8130353473025216, | |
| "eval_sickr_spearman": 0.7694488309426829, | |
| "eval_stsb_spearman": 0.8566218636623602, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "eval_avg_sts": 0.8135852616644544, | |
| "eval_sickr_spearman": 0.7713928417422891, | |
| "eval_stsb_spearman": 0.8557776815866198, | |
| "step": 725 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_avg_sts": 0.8182033488573868, | |
| "eval_sickr_spearman": 0.7772465361678562, | |
| "eval_stsb_spearman": 0.8591601615469172, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_avg_sts": 0.8248685458177708, | |
| "eval_sickr_spearman": 0.7874361422135461, | |
| "eval_stsb_spearman": 0.8623009494219955, | |
| "step": 775 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_avg_sts": 0.8161782720571904, | |
| "eval_sickr_spearman": 0.7755229400927496, | |
| "eval_stsb_spearman": 0.8568336040216311, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "eval_avg_sts": 0.8207483887962784, | |
| "eval_sickr_spearman": 0.7822897537877566, | |
| "eval_stsb_spearman": 0.8592070238048003, | |
| "step": 825 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_avg_sts": 0.8239255438283619, | |
| "eval_sickr_spearman": 0.7867861853488854, | |
| "eval_stsb_spearman": 0.8610649023078384, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_avg_sts": 0.8190144607374632, | |
| "eval_sickr_spearman": 0.7796808964820441, | |
| "eval_stsb_spearman": 0.8583480249928824, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "eval_avg_sts": 0.8211177033463906, | |
| "eval_sickr_spearman": 0.7840137821427762, | |
| "eval_stsb_spearman": 0.8582216245500051, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "eval_avg_sts": 0.8201580926083631, | |
| "eval_sickr_spearman": 0.7816100656713059, | |
| "eval_stsb_spearman": 0.8587061195454205, | |
| "step": 925 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "eval_avg_sts": 0.8140545936227954, | |
| "eval_sickr_spearman": 0.7693706363095416, | |
| "eval_stsb_spearman": 0.8587385509360493, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 1.81, | |
| "eval_avg_sts": 0.8205478478328316, | |
| "eval_sickr_spearman": 0.778550484509698, | |
| "eval_stsb_spearman": 0.8625452111559652, | |
| "step": 975 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "learning_rate": 1.9078540507111937e-05, | |
| "loss": 0.2352, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "eval_avg_sts": 0.8194978907732944, | |
| "eval_sickr_spearman": 0.7797764783739058, | |
| "eval_stsb_spearman": 0.859219303172683, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "eval_avg_sts": 0.8179603788237452, | |
| "eval_sickr_spearman": 0.7792966476705391, | |
| "eval_stsb_spearman": 0.8566241099769513, | |
| "step": 1025 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_avg_sts": 0.814634655693672, | |
| "eval_sickr_spearman": 0.7726660501792106, | |
| "eval_stsb_spearman": 0.8566032612081333, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "eval_avg_sts": 0.8229387572431492, | |
| "eval_sickr_spearman": 0.786164518802972, | |
| "eval_stsb_spearman": 0.8597129956833264, | |
| "step": 1075 | |
| }, | |
| { | |
| "epoch": 2.04, | |
| "eval_avg_sts": 0.8170446704890681, | |
| "eval_sickr_spearman": 0.7740013628302915, | |
| "eval_stsb_spearman": 0.8600879781478449, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 2.09, | |
| "eval_avg_sts": 0.823749807845302, | |
| "eval_sickr_spearman": 0.7840726202420378, | |
| "eval_stsb_spearman": 0.8634269954485662, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 2.13, | |
| "eval_avg_sts": 0.824679097934147, | |
| "eval_sickr_spearman": 0.786571486325457, | |
| "eval_stsb_spearman": 0.8627867095428369, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 2.18, | |
| "eval_avg_sts": 0.8215752053838693, | |
| "eval_sickr_spearman": 0.7836207916708096, | |
| "eval_stsb_spearman": 0.859529619096929, | |
| "step": 1175 | |
| }, | |
| { | |
| "epoch": 2.23, | |
| "eval_avg_sts": 0.8271625177527122, | |
| "eval_sickr_spearman": 0.790379536140775, | |
| "eval_stsb_spearman": 0.8639454993646494, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "eval_avg_sts": 0.8175642564462906, | |
| "eval_sickr_spearman": 0.7762766441365164, | |
| "eval_stsb_spearman": 0.8588518687560649, | |
| "step": 1225 | |
| }, | |
| { | |
| "epoch": 2.32, | |
| "eval_avg_sts": 0.8189636390886708, | |
| "eval_sickr_spearman": 0.7794043814310648, | |
| "eval_stsb_spearman": 0.8585228967462767, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 2.37, | |
| "eval_avg_sts": 0.8235331481562411, | |
| "eval_sickr_spearman": 0.7853204202262986, | |
| "eval_stsb_spearman": 0.8617458760861836, | |
| "step": 1275 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "eval_avg_sts": 0.8212932121455792, | |
| "eval_sickr_spearman": 0.7838025893897528, | |
| "eval_stsb_spearman": 0.8587838349014056, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "eval_avg_sts": 0.8200184185533622, | |
| "eval_sickr_spearman": 0.7804020834701373, | |
| "eval_stsb_spearman": 0.8596347536365871, | |
| "step": 1325 | |
| }, | |
| { | |
| "epoch": 2.5, | |
| "eval_avg_sts": 0.8184879956680027, | |
| "eval_sickr_spearman": 0.7775680563608829, | |
| "eval_stsb_spearman": 0.8594079349751224, | |
| "step": 1350 | |
| }, | |
| { | |
| "epoch": 2.55, | |
| "eval_avg_sts": 0.8240646293698506, | |
| "eval_sickr_spearman": 0.7871783112610262, | |
| "eval_stsb_spearman": 0.8609509474786748, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 2.6, | |
| "eval_avg_sts": 0.8232889615255443, | |
| "eval_sickr_spearman": 0.7868230252036885, | |
| "eval_stsb_spearman": 0.8597548978474002, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 2.64, | |
| "eval_avg_sts": 0.8214126106703122, | |
| "eval_sickr_spearman": 0.7826799584558398, | |
| "eval_stsb_spearman": 0.8601452628847847, | |
| "step": 1425 | |
| }, | |
| { | |
| "epoch": 2.69, | |
| "eval_avg_sts": 0.8256026599230287, | |
| "eval_sickr_spearman": 0.7879515639630783, | |
| "eval_stsb_spearman": 0.8632537558829791, | |
| "step": 1450 | |
| }, | |
| { | |
| "epoch": 2.74, | |
| "eval_avg_sts": 0.8227290144728177, | |
| "eval_sickr_spearman": 0.7835550370929407, | |
| "eval_stsb_spearman": 0.8619029918526946, | |
| "step": 1475 | |
| }, | |
| { | |
| "epoch": 2.78, | |
| "learning_rate": 3.6178107606679037e-06, | |
| "loss": 0.2129, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 2.78, | |
| "eval_avg_sts": 0.8228934679819335, | |
| "eval_sickr_spearman": 0.7842996632585357, | |
| "eval_stsb_spearman": 0.8614872727053314, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 2.83, | |
| "eval_avg_sts": 0.8208607916598496, | |
| "eval_sickr_spearman": 0.7816013240108441, | |
| "eval_stsb_spearman": 0.860120259308855, | |
| "step": 1525 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "eval_avg_sts": 0.8206687609569976, | |
| "eval_sickr_spearman": 0.7812808124709476, | |
| "eval_stsb_spearman": 0.8600567094430476, | |
| "step": 1550 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "eval_avg_sts": 0.8208944641677367, | |
| "eval_sickr_spearman": 0.7819390787161569, | |
| "eval_stsb_spearman": 0.8598498496193164, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 2.97, | |
| "eval_avg_sts": 0.8211952992867365, | |
| "eval_sickr_spearman": 0.7822705413471812, | |
| "eval_stsb_spearman": 0.8601200572262918, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "step": 1617, | |
| "train_runtime": 2320.0614, | |
| "train_samples_per_second": 0.697 | |
| } | |
| ], | |
| "max_steps": 1617, | |
| "num_train_epochs": 3, | |
| "total_flos": 156090475282942080, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |