SynCSE-scratch-RoBERTa-base / trainer_state.json
Junlei
init
59dc35f
{
"best_metric": 0.8287429760185343,
"best_model_checkpoint": "result/my-sup-simcse-roberta-base_filtered_final_augx_0517_275578",
"epoch": 3.0,
"global_step": 1617,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.05,
"eval_avg_sts": 0.7923727821060924,
"eval_sickr_spearman": 0.7589401062590382,
"eval_stsb_spearman": 0.8258054579531467,
"step": 25
},
{
"epoch": 0.09,
"eval_avg_sts": 0.788369556206714,
"eval_sickr_spearman": 0.7429059316970545,
"eval_stsb_spearman": 0.8338331807163735,
"step": 50
},
{
"epoch": 0.14,
"eval_avg_sts": 0.8104646483652821,
"eval_sickr_spearman": 0.7750206308339096,
"eval_stsb_spearman": 0.8459086658966546,
"step": 75
},
{
"epoch": 0.19,
"eval_avg_sts": 0.8156440464261943,
"eval_sickr_spearman": 0.7790718621158088,
"eval_stsb_spearman": 0.8522162307365796,
"step": 100
},
{
"epoch": 0.23,
"eval_avg_sts": 0.8158874725367419,
"eval_sickr_spearman": 0.7767967729339896,
"eval_stsb_spearman": 0.8549781721394941,
"step": 125
},
{
"epoch": 0.28,
"eval_avg_sts": 0.8226456308827159,
"eval_sickr_spearman": 0.7900410609689407,
"eval_stsb_spearman": 0.8552502007964913,
"step": 150
},
{
"epoch": 0.32,
"eval_avg_sts": 0.8233733407465815,
"eval_sickr_spearman": 0.7881731314340124,
"eval_stsb_spearman": 0.8585735500591508,
"step": 175
},
{
"epoch": 0.37,
"eval_avg_sts": 0.8246758200303745,
"eval_sickr_spearman": 0.7910648919271954,
"eval_stsb_spearman": 0.8582867481335537,
"step": 200
},
{
"epoch": 0.42,
"eval_avg_sts": 0.8127837390967988,
"eval_sickr_spearman": 0.7683723098661505,
"eval_stsb_spearman": 0.8571951683274471,
"step": 225
},
{
"epoch": 0.46,
"eval_avg_sts": 0.8211001358940954,
"eval_sickr_spearman": 0.7857309900813916,
"eval_stsb_spearman": 0.8564692817067991,
"step": 250
},
{
"epoch": 0.51,
"eval_avg_sts": 0.8231415754884768,
"eval_sickr_spearman": 0.7870932481803794,
"eval_stsb_spearman": 0.859189902796574,
"step": 275
},
{
"epoch": 0.56,
"eval_avg_sts": 0.8281698148839484,
"eval_sickr_spearman": 0.7933201442641206,
"eval_stsb_spearman": 0.8630194855037762,
"step": 300
},
{
"epoch": 0.6,
"eval_avg_sts": 0.8261624892170372,
"eval_sickr_spearman": 0.7934045829404487,
"eval_stsb_spearman": 0.8589203954936255,
"step": 325
},
{
"epoch": 0.65,
"eval_avg_sts": 0.8223223884475288,
"eval_sickr_spearman": 0.7860610117793729,
"eval_stsb_spearman": 0.8585837651156847,
"step": 350
},
{
"epoch": 0.7,
"eval_avg_sts": 0.8239117966986287,
"eval_sickr_spearman": 0.7878053572903008,
"eval_stsb_spearman": 0.8600182361069565,
"step": 375
},
{
"epoch": 0.74,
"eval_avg_sts": 0.8189825828946973,
"eval_sickr_spearman": 0.7824180448596978,
"eval_stsb_spearman": 0.8555471209296966,
"step": 400
},
{
"epoch": 0.79,
"eval_avg_sts": 0.8284554395260346,
"eval_sickr_spearman": 0.7938278330063215,
"eval_stsb_spearman": 0.8630830460457476,
"step": 425
},
{
"epoch": 0.83,
"eval_avg_sts": 0.8287429760185343,
"eval_sickr_spearman": 0.7950705897249312,
"eval_stsb_spearman": 0.8624153623121376,
"step": 450
},
{
"epoch": 0.88,
"eval_avg_sts": 0.8175086199936331,
"eval_sickr_spearman": 0.7783943353989228,
"eval_stsb_spearman": 0.8566229045883434,
"step": 475
},
{
"epoch": 0.93,
"learning_rate": 3.453927025355597e-05,
"loss": 0.4533,
"step": 500
},
{
"epoch": 0.93,
"eval_avg_sts": 0.8230793846551405,
"eval_sickr_spearman": 0.791305047434386,
"eval_stsb_spearman": 0.8548537218758949,
"step": 500
},
{
"epoch": 0.97,
"eval_avg_sts": 0.813507998872834,
"eval_sickr_spearman": 0.7710531177618173,
"eval_stsb_spearman": 0.8559628799838506,
"step": 525
},
{
"epoch": 1.02,
"eval_avg_sts": 0.8152806946649198,
"eval_sickr_spearman": 0.7748347024402428,
"eval_stsb_spearman": 0.8557266868895969,
"step": 550
},
{
"epoch": 1.07,
"eval_avg_sts": 0.8193593042077025,
"eval_sickr_spearman": 0.7769575330305031,
"eval_stsb_spearman": 0.8617610753849019,
"step": 575
},
{
"epoch": 1.11,
"eval_avg_sts": 0.8122703001838674,
"eval_sickr_spearman": 0.7715038416177126,
"eval_stsb_spearman": 0.8530367587500223,
"step": 600
},
{
"epoch": 1.16,
"eval_avg_sts": 0.8236420464403356,
"eval_sickr_spearman": 0.7849814167123483,
"eval_stsb_spearman": 0.8623026761683228,
"step": 625
},
{
"epoch": 1.21,
"eval_avg_sts": 0.8133106230456628,
"eval_sickr_spearman": 0.770097202780996,
"eval_stsb_spearman": 0.8565240433103297,
"step": 650
},
{
"epoch": 1.25,
"eval_avg_sts": 0.8207134638537716,
"eval_sickr_spearman": 0.7790919391162099,
"eval_stsb_spearman": 0.8623349885913333,
"step": 675
},
{
"epoch": 1.3,
"eval_avg_sts": 0.8130353473025216,
"eval_sickr_spearman": 0.7694488309426829,
"eval_stsb_spearman": 0.8566218636623602,
"step": 700
},
{
"epoch": 1.35,
"eval_avg_sts": 0.8135852616644544,
"eval_sickr_spearman": 0.7713928417422891,
"eval_stsb_spearman": 0.8557776815866198,
"step": 725
},
{
"epoch": 1.39,
"eval_avg_sts": 0.8182033488573868,
"eval_sickr_spearman": 0.7772465361678562,
"eval_stsb_spearman": 0.8591601615469172,
"step": 750
},
{
"epoch": 1.44,
"eval_avg_sts": 0.8248685458177708,
"eval_sickr_spearman": 0.7874361422135461,
"eval_stsb_spearman": 0.8623009494219955,
"step": 775
},
{
"epoch": 1.48,
"eval_avg_sts": 0.8161782720571904,
"eval_sickr_spearman": 0.7755229400927496,
"eval_stsb_spearman": 0.8568336040216311,
"step": 800
},
{
"epoch": 1.53,
"eval_avg_sts": 0.8207483887962784,
"eval_sickr_spearman": 0.7822897537877566,
"eval_stsb_spearman": 0.8592070238048003,
"step": 825
},
{
"epoch": 1.58,
"eval_avg_sts": 0.8239255438283619,
"eval_sickr_spearman": 0.7867861853488854,
"eval_stsb_spearman": 0.8610649023078384,
"step": 850
},
{
"epoch": 1.62,
"eval_avg_sts": 0.8190144607374632,
"eval_sickr_spearman": 0.7796808964820441,
"eval_stsb_spearman": 0.8583480249928824,
"step": 875
},
{
"epoch": 1.67,
"eval_avg_sts": 0.8211177033463906,
"eval_sickr_spearman": 0.7840137821427762,
"eval_stsb_spearman": 0.8582216245500051,
"step": 900
},
{
"epoch": 1.72,
"eval_avg_sts": 0.8201580926083631,
"eval_sickr_spearman": 0.7816100656713059,
"eval_stsb_spearman": 0.8587061195454205,
"step": 925
},
{
"epoch": 1.76,
"eval_avg_sts": 0.8140545936227954,
"eval_sickr_spearman": 0.7693706363095416,
"eval_stsb_spearman": 0.8587385509360493,
"step": 950
},
{
"epoch": 1.81,
"eval_avg_sts": 0.8205478478328316,
"eval_sickr_spearman": 0.778550484509698,
"eval_stsb_spearman": 0.8625452111559652,
"step": 975
},
{
"epoch": 1.86,
"learning_rate": 1.9078540507111937e-05,
"loss": 0.2352,
"step": 1000
},
{
"epoch": 1.86,
"eval_avg_sts": 0.8194978907732944,
"eval_sickr_spearman": 0.7797764783739058,
"eval_stsb_spearman": 0.859219303172683,
"step": 1000
},
{
"epoch": 1.9,
"eval_avg_sts": 0.8179603788237452,
"eval_sickr_spearman": 0.7792966476705391,
"eval_stsb_spearman": 0.8566241099769513,
"step": 1025
},
{
"epoch": 1.95,
"eval_avg_sts": 0.814634655693672,
"eval_sickr_spearman": 0.7726660501792106,
"eval_stsb_spearman": 0.8566032612081333,
"step": 1050
},
{
"epoch": 1.99,
"eval_avg_sts": 0.8229387572431492,
"eval_sickr_spearman": 0.786164518802972,
"eval_stsb_spearman": 0.8597129956833264,
"step": 1075
},
{
"epoch": 2.04,
"eval_avg_sts": 0.8170446704890681,
"eval_sickr_spearman": 0.7740013628302915,
"eval_stsb_spearman": 0.8600879781478449,
"step": 1100
},
{
"epoch": 2.09,
"eval_avg_sts": 0.823749807845302,
"eval_sickr_spearman": 0.7840726202420378,
"eval_stsb_spearman": 0.8634269954485662,
"step": 1125
},
{
"epoch": 2.13,
"eval_avg_sts": 0.824679097934147,
"eval_sickr_spearman": 0.786571486325457,
"eval_stsb_spearman": 0.8627867095428369,
"step": 1150
},
{
"epoch": 2.18,
"eval_avg_sts": 0.8215752053838693,
"eval_sickr_spearman": 0.7836207916708096,
"eval_stsb_spearman": 0.859529619096929,
"step": 1175
},
{
"epoch": 2.23,
"eval_avg_sts": 0.8271625177527122,
"eval_sickr_spearman": 0.790379536140775,
"eval_stsb_spearman": 0.8639454993646494,
"step": 1200
},
{
"epoch": 2.27,
"eval_avg_sts": 0.8175642564462906,
"eval_sickr_spearman": 0.7762766441365164,
"eval_stsb_spearman": 0.8588518687560649,
"step": 1225
},
{
"epoch": 2.32,
"eval_avg_sts": 0.8189636390886708,
"eval_sickr_spearman": 0.7794043814310648,
"eval_stsb_spearman": 0.8585228967462767,
"step": 1250
},
{
"epoch": 2.37,
"eval_avg_sts": 0.8235331481562411,
"eval_sickr_spearman": 0.7853204202262986,
"eval_stsb_spearman": 0.8617458760861836,
"step": 1275
},
{
"epoch": 2.41,
"eval_avg_sts": 0.8212932121455792,
"eval_sickr_spearman": 0.7838025893897528,
"eval_stsb_spearman": 0.8587838349014056,
"step": 1300
},
{
"epoch": 2.46,
"eval_avg_sts": 0.8200184185533622,
"eval_sickr_spearman": 0.7804020834701373,
"eval_stsb_spearman": 0.8596347536365871,
"step": 1325
},
{
"epoch": 2.5,
"eval_avg_sts": 0.8184879956680027,
"eval_sickr_spearman": 0.7775680563608829,
"eval_stsb_spearman": 0.8594079349751224,
"step": 1350
},
{
"epoch": 2.55,
"eval_avg_sts": 0.8240646293698506,
"eval_sickr_spearman": 0.7871783112610262,
"eval_stsb_spearman": 0.8609509474786748,
"step": 1375
},
{
"epoch": 2.6,
"eval_avg_sts": 0.8232889615255443,
"eval_sickr_spearman": 0.7868230252036885,
"eval_stsb_spearman": 0.8597548978474002,
"step": 1400
},
{
"epoch": 2.64,
"eval_avg_sts": 0.8214126106703122,
"eval_sickr_spearman": 0.7826799584558398,
"eval_stsb_spearman": 0.8601452628847847,
"step": 1425
},
{
"epoch": 2.69,
"eval_avg_sts": 0.8256026599230287,
"eval_sickr_spearman": 0.7879515639630783,
"eval_stsb_spearman": 0.8632537558829791,
"step": 1450
},
{
"epoch": 2.74,
"eval_avg_sts": 0.8227290144728177,
"eval_sickr_spearman": 0.7835550370929407,
"eval_stsb_spearman": 0.8619029918526946,
"step": 1475
},
{
"epoch": 2.78,
"learning_rate": 3.6178107606679037e-06,
"loss": 0.2129,
"step": 1500
},
{
"epoch": 2.78,
"eval_avg_sts": 0.8228934679819335,
"eval_sickr_spearman": 0.7842996632585357,
"eval_stsb_spearman": 0.8614872727053314,
"step": 1500
},
{
"epoch": 2.83,
"eval_avg_sts": 0.8208607916598496,
"eval_sickr_spearman": 0.7816013240108441,
"eval_stsb_spearman": 0.860120259308855,
"step": 1525
},
{
"epoch": 2.88,
"eval_avg_sts": 0.8206687609569976,
"eval_sickr_spearman": 0.7812808124709476,
"eval_stsb_spearman": 0.8600567094430476,
"step": 1550
},
{
"epoch": 2.92,
"eval_avg_sts": 0.8208944641677367,
"eval_sickr_spearman": 0.7819390787161569,
"eval_stsb_spearman": 0.8598498496193164,
"step": 1575
},
{
"epoch": 2.97,
"eval_avg_sts": 0.8211952992867365,
"eval_sickr_spearman": 0.7822705413471812,
"eval_stsb_spearman": 0.8601200572262918,
"step": 1600
},
{
"epoch": 3.0,
"step": 1617,
"train_runtime": 2320.0614,
"train_samples_per_second": 0.697
}
],
"max_steps": 1617,
"num_train_epochs": 3,
"total_flos": 156090475282942080,
"trial_name": null,
"trial_params": null
}