bcai001's picture
Upload 9 files
60eeaf1 verified
{
"best_metric": 0.8754395915831782,
"best_model_checkpoint": "v3v2dqwsyn8103.san-roberta-large",
"epoch": 3.0,
"global_step": 6126,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.06,
"eval_avg_sts": 0.8149644786494956,
"eval_sickr_spearman": 0.7907241592935935,
"eval_stsb_spearman": 0.8392047980053978,
"step": 125
},
{
"epoch": 0.12,
"eval_avg_sts": 0.8388577709591086,
"eval_sickr_spearman": 0.8233415039069986,
"eval_stsb_spearman": 0.8543740380112187,
"step": 250
},
{
"epoch": 0.18,
"eval_avg_sts": 0.8396589199542435,
"eval_sickr_spearman": 0.8129205800767828,
"eval_stsb_spearman": 0.8663972598317042,
"step": 375
},
{
"epoch": 0.24,
"learning_rate": 9.183806725432584e-06,
"loss": 0.5341,
"step": 500
},
{
"epoch": 0.24,
"eval_avg_sts": 0.8363342200594388,
"eval_sickr_spearman": 0.8093077766888108,
"eval_stsb_spearman": 0.8633606634300668,
"step": 500
},
{
"epoch": 0.31,
"eval_avg_sts": 0.8338329341909468,
"eval_sickr_spearman": 0.8055060189477813,
"eval_stsb_spearman": 0.8621598494341124,
"step": 625
},
{
"epoch": 0.37,
"eval_avg_sts": 0.839609299977649,
"eval_sickr_spearman": 0.8169147023790718,
"eval_stsb_spearman": 0.8623038975762263,
"step": 750
},
{
"epoch": 0.43,
"eval_avg_sts": 0.846074071178897,
"eval_sickr_spearman": 0.8259940214839182,
"eval_stsb_spearman": 0.8661541208738758,
"step": 875
},
{
"epoch": 0.49,
"learning_rate": 8.367613450865165e-06,
"loss": 0.1279,
"step": 1000
},
{
"epoch": 0.49,
"eval_avg_sts": 0.8453144553836196,
"eval_sickr_spearman": 0.8210699209955844,
"eval_stsb_spearman": 0.8695589897716549,
"step": 1000
},
{
"epoch": 0.55,
"eval_avg_sts": 0.845320179475549,
"eval_sickr_spearman": 0.8282974490155858,
"eval_stsb_spearman": 0.8623429099355123,
"step": 1125
},
{
"epoch": 0.61,
"eval_avg_sts": 0.8460474498271838,
"eval_sickr_spearman": 0.826672508822833,
"eval_stsb_spearman": 0.8654223908315346,
"step": 1250
},
{
"epoch": 0.67,
"eval_avg_sts": 0.8426410233010573,
"eval_sickr_spearman": 0.8190030466384995,
"eval_stsb_spearman": 0.8662789999636149,
"step": 1375
},
{
"epoch": 0.73,
"learning_rate": 7.551420176297748e-06,
"loss": 0.1108,
"step": 1500
},
{
"epoch": 0.73,
"eval_avg_sts": 0.8549386812398281,
"eval_sickr_spearman": 0.8434020296403363,
"eval_stsb_spearman": 0.8664753328393199,
"step": 1500
},
{
"epoch": 0.8,
"eval_avg_sts": 0.8501103601570379,
"eval_sickr_spearman": 0.834787891752918,
"eval_stsb_spearman": 0.8654328285611577,
"step": 1625
},
{
"epoch": 0.86,
"eval_avg_sts": 0.849271502533093,
"eval_sickr_spearman": 0.8330568988881898,
"eval_stsb_spearman": 0.8654861061779964,
"step": 1750
},
{
"epoch": 0.92,
"eval_avg_sts": 0.8536431760480087,
"eval_sickr_spearman": 0.8382815780093236,
"eval_stsb_spearman": 0.8690047740866937,
"step": 1875
},
{
"epoch": 0.98,
"learning_rate": 6.735226901730331e-06,
"loss": 0.0995,
"step": 2000
},
{
"epoch": 0.98,
"eval_avg_sts": 0.859307976655676,
"eval_sickr_spearman": 0.8446237487365161,
"eval_stsb_spearman": 0.873992204574836,
"step": 2000
},
{
"epoch": 1.04,
"eval_avg_sts": 0.8539432294379701,
"eval_sickr_spearman": 0.839737448725014,
"eval_stsb_spearman": 0.868149010150926,
"step": 2125
},
{
"epoch": 1.1,
"eval_avg_sts": 0.8550783980122398,
"eval_sickr_spearman": 0.8398799570029809,
"eval_stsb_spearman": 0.8702768390214988,
"step": 2250
},
{
"epoch": 1.16,
"eval_avg_sts": 0.8513744867439872,
"eval_sickr_spearman": 0.8382596758270676,
"eval_stsb_spearman": 0.8644892976609067,
"step": 2375
},
{
"epoch": 1.22,
"learning_rate": 5.919033627162912e-06,
"loss": 0.0755,
"step": 2500
},
{
"epoch": 1.22,
"eval_avg_sts": 0.852586624774087,
"eval_sickr_spearman": 0.8348869799151848,
"eval_stsb_spearman": 0.8702862696329892,
"step": 2500
},
{
"epoch": 1.29,
"eval_avg_sts": 0.8536153767856529,
"eval_sickr_spearman": 0.8408841432407476,
"eval_stsb_spearman": 0.8663466103305583,
"step": 2625
},
{
"epoch": 1.35,
"eval_avg_sts": 0.8516843556326315,
"eval_sickr_spearman": 0.8374268645592322,
"eval_stsb_spearman": 0.8659418467060308,
"step": 2750
},
{
"epoch": 1.41,
"eval_avg_sts": 0.8415420172889546,
"eval_sickr_spearman": 0.819215344106856,
"eval_stsb_spearman": 0.8638686904710532,
"step": 2875
},
{
"epoch": 1.47,
"learning_rate": 5.102840352595495e-06,
"loss": 0.0701,
"step": 3000
},
{
"epoch": 1.47,
"eval_avg_sts": 0.8561622122931456,
"eval_sickr_spearman": 0.8410006666928366,
"eval_stsb_spearman": 0.8713237578934547,
"step": 3000
},
{
"epoch": 1.53,
"eval_avg_sts": 0.8482745103445485,
"eval_sickr_spearman": 0.8300929476495453,
"eval_stsb_spearman": 0.8664560730395516,
"step": 3125
},
{
"epoch": 1.59,
"eval_avg_sts": 0.8509009129630769,
"eval_sickr_spearman": 0.8311688923528606,
"eval_stsb_spearman": 0.8706329335732933,
"step": 3250
},
{
"epoch": 1.65,
"eval_avg_sts": 0.8546193575409455,
"eval_sickr_spearman": 0.833799123498713,
"eval_stsb_spearman": 0.8754395915831782,
"step": 3375
},
{
"epoch": 1.71,
"learning_rate": 4.286647078028077e-06,
"loss": 0.0691,
"step": 3500
},
{
"epoch": 1.71,
"eval_avg_sts": 0.8480763616470857,
"eval_sickr_spearman": 0.8280656989511468,
"eval_stsb_spearman": 0.8680870243430245,
"step": 3500
},
{
"epoch": 1.78,
"eval_avg_sts": 0.8510804038712448,
"eval_sickr_spearman": 0.8315828243850542,
"eval_stsb_spearman": 0.8705779833574355,
"step": 3625
},
{
"epoch": 1.84,
"eval_avg_sts": 0.8481254894982377,
"eval_sickr_spearman": 0.8284941363759749,
"eval_stsb_spearman": 0.8677568426205006,
"step": 3750
},
{
"epoch": 1.9,
"eval_avg_sts": 0.8518486456802068,
"eval_sickr_spearman": 0.8313096234800742,
"eval_stsb_spearman": 0.8723876678803395,
"step": 3875
},
{
"epoch": 1.96,
"learning_rate": 3.47045380346066e-06,
"loss": 0.0639,
"step": 4000
},
{
"epoch": 1.96,
"eval_avg_sts": 0.8494848749262629,
"eval_sickr_spearman": 0.8275968673700096,
"eval_stsb_spearman": 0.8713728824825163,
"step": 4000
},
{
"epoch": 2.02,
"eval_avg_sts": 0.8478683507440115,
"eval_sickr_spearman": 0.8257009357029429,
"eval_stsb_spearman": 0.87003576578508,
"step": 4125
},
{
"epoch": 2.08,
"eval_avg_sts": 0.8511953137011732,
"eval_sickr_spearman": 0.8320414253415853,
"eval_stsb_spearman": 0.870349202060761,
"step": 4250
},
{
"epoch": 2.14,
"eval_avg_sts": 0.8501760957050806,
"eval_sickr_spearman": 0.8315510758270036,
"eval_stsb_spearman": 0.8688011155831574,
"step": 4375
},
{
"epoch": 2.2,
"learning_rate": 2.654260528893242e-06,
"loss": 0.0525,
"step": 4500
},
{
"epoch": 2.2,
"eval_avg_sts": 0.8496234541718779,
"eval_sickr_spearman": 0.8301971271085646,
"eval_stsb_spearman": 0.8690497812351913,
"step": 4500
},
{
"epoch": 2.26,
"eval_avg_sts": 0.8437167774343648,
"eval_sickr_spearman": 0.820443979681643,
"eval_stsb_spearman": 0.8669895751870865,
"step": 4625
},
{
"epoch": 2.33,
"eval_avg_sts": 0.8439814114677218,
"eval_sickr_spearman": 0.8205907627276378,
"eval_stsb_spearman": 0.8673720602078059,
"step": 4750
},
{
"epoch": 2.39,
"eval_avg_sts": 0.848080574777744,
"eval_sickr_spearman": 0.8265265903366641,
"eval_stsb_spearman": 0.869634559218824,
"step": 4875
},
{
"epoch": 2.45,
"learning_rate": 1.8380672543258246e-06,
"loss": 0.0462,
"step": 5000
},
{
"epoch": 2.45,
"eval_avg_sts": 0.8452623360298752,
"eval_sickr_spearman": 0.8238323337325946,
"eval_stsb_spearman": 0.866692338327156,
"step": 5000
},
{
"epoch": 2.51,
"eval_avg_sts": 0.847977497396065,
"eval_sickr_spearman": 0.8265478681146011,
"eval_stsb_spearman": 0.8694071266775288,
"step": 5125
},
{
"epoch": 2.57,
"eval_avg_sts": 0.8479098375907992,
"eval_sickr_spearman": 0.826889897587942,
"eval_stsb_spearman": 0.8689297775936565,
"step": 5250
},
{
"epoch": 2.63,
"eval_avg_sts": 0.8457732999493977,
"eval_sickr_spearman": 0.8235308425088674,
"eval_stsb_spearman": 0.8680157573899278,
"step": 5375
},
{
"epoch": 2.69,
"learning_rate": 1.021873979758407e-06,
"loss": 0.0454,
"step": 5500
},
{
"epoch": 2.69,
"eval_avg_sts": 0.8463330711965237,
"eval_sickr_spearman": 0.824173882894921,
"eval_stsb_spearman": 0.8684922594981264,
"step": 5500
},
{
"epoch": 2.75,
"eval_avg_sts": 0.8475412183069994,
"eval_sickr_spearman": 0.8259262015686877,
"eval_stsb_spearman": 0.869156235045311,
"step": 5625
},
{
"epoch": 2.82,
"eval_avg_sts": 0.8474056652640968,
"eval_sickr_spearman": 0.8258597265242973,
"eval_stsb_spearman": 0.8689516040038963,
"step": 5750
},
{
"epoch": 2.88,
"eval_avg_sts": 0.846709994814922,
"eval_sickr_spearman": 0.8247918990771251,
"eval_stsb_spearman": 0.868628090552719,
"step": 5875
},
{
"epoch": 2.94,
"learning_rate": 2.0568070519098922e-07,
"loss": 0.0456,
"step": 6000
},
{
"epoch": 2.94,
"eval_avg_sts": 0.8476613552908148,
"eval_sickr_spearman": 0.8262576161686107,
"eval_stsb_spearman": 0.8690650944130188,
"step": 6000
},
{
"epoch": 3.0,
"eval_avg_sts": 0.8477936113942104,
"eval_sickr_spearman": 0.8264356674616418,
"eval_stsb_spearman": 0.8691515553267789,
"step": 6125
},
{
"epoch": 3.0,
"step": 6126,
"train_runtime": 4478.0897,
"train_samples_per_second": 1.368
}
],
"max_steps": 6126,
"num_train_epochs": 3,
"total_flos": 213963637016494080,
"trial_name": null,
"trial_params": null
}