DEk21_hcmute_embedding / trainer_state.json
huyydangg's picture
Initial model upload
ed088a0 verified
{
"best_metric": 0.16643136739730835,
"best_model_checkpoint": "bkai-fine-tuned-legal/checkpoint-282",
"epoch": 5.878048780487805,
"eval_steps": 500,
"global_step": 282,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3041986.25,
"learning_rate": 2.9967614628878062e-05,
"loss": 1.1542,
"step": 48
},
{
"epoch": 1.0,
"eval_dim_128_cosine_accuracy@1": 0.19871705480407195,
"eval_dim_128_cosine_accuracy@10": 0.6681076558360062,
"eval_dim_128_cosine_accuracy@3": 0.3995258680797657,
"eval_dim_128_cosine_accuracy@5": 0.4922604936549993,
"eval_dim_128_cosine_map@100": 0.33912660774009473,
"eval_dim_128_cosine_mrr@10": 0.32818611337994835,
"eval_dim_128_cosine_ndcg@10": 0.40810554118165804,
"eval_dim_128_cosine_precision@1": 0.19871705480407195,
"eval_dim_128_cosine_precision@10": 0.06681076558360062,
"eval_dim_128_cosine_precision@3": 0.1331752893599219,
"eval_dim_128_cosine_precision@5": 0.09845209873099986,
"eval_dim_128_cosine_recall@1": 0.19871705480407195,
"eval_dim_128_cosine_recall@10": 0.6681076558360062,
"eval_dim_128_cosine_recall@3": 0.3995258680797657,
"eval_dim_128_cosine_recall@5": 0.4922604936549993,
"eval_dim_256_cosine_accuracy@1": 0.19983265932227026,
"eval_dim_256_cosine_accuracy@10": 0.6777297448054664,
"eval_dim_256_cosine_accuracy@3": 0.3998047692093153,
"eval_dim_256_cosine_accuracy@5": 0.4954678566448194,
"eval_dim_256_cosine_map@100": 0.34191237247567885,
"eval_dim_256_cosine_mrr@10": 0.33120438804443747,
"eval_dim_256_cosine_ndcg@10": 0.4125662992991588,
"eval_dim_256_cosine_precision@1": 0.19983265932227026,
"eval_dim_256_cosine_precision@10": 0.06777297448054664,
"eval_dim_256_cosine_precision@3": 0.13326825640310508,
"eval_dim_256_cosine_precision@5": 0.09909357132896388,
"eval_dim_256_cosine_recall@1": 0.19983265932227026,
"eval_dim_256_cosine_recall@10": 0.6777297448054664,
"eval_dim_256_cosine_recall@3": 0.3998047692093153,
"eval_dim_256_cosine_recall@5": 0.4954678566448194,
"eval_dim_512_cosine_accuracy@1": 0.20945474829173058,
"eval_dim_512_cosine_accuracy@10": 0.6849811741737554,
"eval_dim_512_cosine_accuracy@3": 0.41040301213219915,
"eval_dim_512_cosine_accuracy@5": 0.5059266490029285,
"eval_dim_512_cosine_map@100": 0.3513161520991861,
"eval_dim_512_cosine_mrr@10": 0.340864051193851,
"eval_dim_512_cosine_ndcg@10": 0.42175585614805716,
"eval_dim_512_cosine_precision@1": 0.20945474829173058,
"eval_dim_512_cosine_precision@10": 0.06849811741737553,
"eval_dim_512_cosine_precision@3": 0.13680100404406637,
"eval_dim_512_cosine_precision@5": 0.1011853298005857,
"eval_dim_512_cosine_recall@1": 0.20945474829173058,
"eval_dim_512_cosine_recall@10": 0.6849811741737554,
"eval_dim_512_cosine_recall@3": 0.41040301213219915,
"eval_dim_512_cosine_recall@5": 0.5059266490029285,
"eval_dim_64_cosine_accuracy@1": 0.18923441639938643,
"eval_dim_64_cosine_accuracy@10": 0.6431460047413192,
"eval_dim_64_cosine_accuracy@3": 0.38056059127039465,
"eval_dim_64_cosine_accuracy@5": 0.4667410403012132,
"eval_dim_64_cosine_map@100": 0.32516177346707625,
"eval_dim_64_cosine_mrr@10": 0.3137617785923441,
"eval_dim_64_cosine_ndcg@10": 0.39102781421972704,
"eval_dim_64_cosine_precision@1": 0.18923441639938643,
"eval_dim_64_cosine_precision@10": 0.06431460047413191,
"eval_dim_64_cosine_precision@3": 0.12685353042346487,
"eval_dim_64_cosine_precision@5": 0.09334820806024266,
"eval_dim_64_cosine_recall@1": 0.18923441639938643,
"eval_dim_64_cosine_recall@10": 0.6431460047413192,
"eval_dim_64_cosine_recall@3": 0.38056059127039465,
"eval_dim_64_cosine_recall@5": 0.4667410403012132,
"eval_dim_768_cosine_accuracy@1": 0.2069446381257844,
"eval_dim_768_cosine_accuracy@10": 0.6877701854692512,
"eval_dim_768_cosine_accuracy@3": 0.41110026495607305,
"eval_dim_768_cosine_accuracy@5": 0.5078789569097755,
"eval_dim_768_cosine_map@100": 0.35016286957488246,
"eval_dim_768_cosine_mrr@10": 0.33975193293977246,
"eval_dim_768_cosine_ndcg@10": 0.42158855710438475,
"eval_dim_768_cosine_precision@1": 0.2069446381257844,
"eval_dim_768_cosine_precision@10": 0.06877701854692511,
"eval_dim_768_cosine_precision@3": 0.13703342165202437,
"eval_dim_768_cosine_precision@5": 0.1015757913819551,
"eval_dim_768_cosine_recall@1": 0.2069446381257844,
"eval_dim_768_cosine_recall@10": 0.6877701854692512,
"eval_dim_768_cosine_recall@3": 0.41110026495607305,
"eval_dim_768_cosine_recall@5": 0.5078789569097755,
"eval_loss": 0.35814541578292847,
"eval_runtime": 5308.0606,
"eval_samples_per_second": 1.351,
"eval_sequential_score": 0.39102781421972704,
"eval_steps_per_second": 0.014,
"step": 48
},
{
"epoch": 2.0,
"grad_norm": 1227518.25,
"learning_rate": 2.65047365119413e-05,
"loss": 0.3058,
"step": 96
},
{
"epoch": 2.0,
"eval_dim_128_cosine_accuracy@1": 0.319341793334263,
"eval_dim_128_cosine_accuracy@10": 0.7118951331752894,
"eval_dim_128_cosine_accuracy@3": 0.45670059963742854,
"eval_dim_128_cosine_accuracy@5": 0.5373030260772557,
"eval_dim_128_cosine_map@100": 0.43025589198069303,
"eval_dim_128_cosine_mrr@10": 0.4206424465384167,
"eval_dim_128_cosine_ndcg@10": 0.48839839347709046,
"eval_dim_128_cosine_precision@1": 0.319341793334263,
"eval_dim_128_cosine_precision@10": 0.07118951331752894,
"eval_dim_128_cosine_precision@3": 0.15223353321247615,
"eval_dim_128_cosine_precision@5": 0.10746060521545113,
"eval_dim_128_cosine_recall@1": 0.319341793334263,
"eval_dim_128_cosine_recall@10": 0.7118951331752894,
"eval_dim_128_cosine_recall@3": 0.45670059963742854,
"eval_dim_128_cosine_recall@5": 0.5373030260772557,
"eval_dim_256_cosine_accuracy@1": 0.3284060800446242,
"eval_dim_256_cosine_accuracy@10": 0.709524473574118,
"eval_dim_256_cosine_accuracy@3": 0.4618602705340957,
"eval_dim_256_cosine_accuracy@5": 0.5356296192999581,
"eval_dim_256_cosine_map@100": 0.4364935437376769,
"eval_dim_256_cosine_mrr@10": 0.42624382156525586,
"eval_dim_256_cosine_ndcg@10": 0.49204715409513783,
"eval_dim_256_cosine_precision@1": 0.3284060800446242,
"eval_dim_256_cosine_precision@10": 0.07095244735741181,
"eval_dim_256_cosine_precision@3": 0.15395342351136523,
"eval_dim_256_cosine_precision@5": 0.10712592385999165,
"eval_dim_256_cosine_recall@1": 0.3284060800446242,
"eval_dim_256_cosine_recall@10": 0.709524473574118,
"eval_dim_256_cosine_recall@3": 0.4618602705340957,
"eval_dim_256_cosine_recall@5": 0.5356296192999581,
"eval_dim_512_cosine_accuracy@1": 0.33663366336633666,
"eval_dim_512_cosine_accuracy@10": 0.7125923859991633,
"eval_dim_512_cosine_accuracy@3": 0.46841444707851065,
"eval_dim_512_cosine_accuracy@5": 0.5441361037512202,
"eval_dim_512_cosine_map@100": 0.4433337740824084,
"eval_dim_512_cosine_mrr@10": 0.43360332512124483,
"eval_dim_512_cosine_ndcg@10": 0.4984772586608768,
"eval_dim_512_cosine_precision@1": 0.33663366336633666,
"eval_dim_512_cosine_precision@10": 0.07125923859991633,
"eval_dim_512_cosine_precision@3": 0.15613814902617024,
"eval_dim_512_cosine_precision@5": 0.10882722075024404,
"eval_dim_512_cosine_recall@1": 0.33663366336633666,
"eval_dim_512_cosine_recall@10": 0.7125923859991633,
"eval_dim_512_cosine_recall@3": 0.46841444707851065,
"eval_dim_512_cosine_recall@5": 0.5441361037512202,
"eval_dim_64_cosine_accuracy@1": 0.3026077255612885,
"eval_dim_64_cosine_accuracy@10": 0.689861943940873,
"eval_dim_64_cosine_accuracy@3": 0.4437316971133733,
"eval_dim_64_cosine_accuracy@5": 0.519313903221308,
"eval_dim_64_cosine_map@100": 0.4140292225757397,
"eval_dim_64_cosine_mrr@10": 0.4037352829850398,
"eval_dim_64_cosine_ndcg@10": 0.47036063500166436,
"eval_dim_64_cosine_precision@1": 0.3026077255612885,
"eval_dim_64_cosine_precision@10": 0.0689861943940873,
"eval_dim_64_cosine_precision@3": 0.14791056570445774,
"eval_dim_64_cosine_precision@5": 0.10386278064426162,
"eval_dim_64_cosine_recall@1": 0.3026077255612885,
"eval_dim_64_cosine_recall@10": 0.689861943940873,
"eval_dim_64_cosine_recall@3": 0.4437316971133733,
"eval_dim_64_cosine_recall@5": 0.519313903221308,
"eval_dim_768_cosine_accuracy@1": 0.3332868498117417,
"eval_dim_768_cosine_accuracy@10": 0.7166364523776322,
"eval_dim_768_cosine_accuracy@3": 0.46841444707851065,
"eval_dim_768_cosine_accuracy@5": 0.546227862222842,
"eval_dim_768_cosine_map@100": 0.44212169088004494,
"eval_dim_768_cosine_mrr@10": 0.4324117975177812,
"eval_dim_768_cosine_ndcg@10": 0.498508349299699,
"eval_dim_768_cosine_precision@1": 0.3332868498117417,
"eval_dim_768_cosine_precision@10": 0.07166364523776322,
"eval_dim_768_cosine_precision@3": 0.1561381490261702,
"eval_dim_768_cosine_precision@5": 0.1092455724445684,
"eval_dim_768_cosine_recall@1": 0.3332868498117417,
"eval_dim_768_cosine_recall@10": 0.7166364523776322,
"eval_dim_768_cosine_recall@3": 0.46841444707851065,
"eval_dim_768_cosine_recall@5": 0.546227862222842,
"eval_loss": 0.2100292444229126,
"eval_runtime": 5303.3966,
"eval_samples_per_second": 1.352,
"eval_sequential_score": 0.47036063500166436,
"eval_steps_per_second": 0.014,
"step": 96
},
{
"epoch": 3.0,
"grad_norm": 751449.875,
"learning_rate": 1.8611820248535433e-05,
"loss": 0.1395,
"step": 144
},
{
"epoch": 3.0,
"eval_dim_128_cosine_accuracy@1": 0.3420722353925533,
"eval_dim_128_cosine_accuracy@10": 0.7111978803514154,
"eval_dim_128_cosine_accuracy@3": 0.4580951052851764,
"eval_dim_128_cosine_accuracy@5": 0.5392553339841026,
"eval_dim_128_cosine_map@100": 0.44322012540075556,
"eval_dim_128_cosine_mrr@10": 0.43320030192154113,
"eval_dim_128_cosine_ndcg@10": 0.49761764615839976,
"eval_dim_128_cosine_precision@1": 0.3420722353925533,
"eval_dim_128_cosine_precision@10": 0.07111978803514155,
"eval_dim_128_cosine_precision@3": 0.15269836842839213,
"eval_dim_128_cosine_precision@5": 0.10785106679682054,
"eval_dim_128_cosine_recall@1": 0.3420722353925533,
"eval_dim_128_cosine_recall@10": 0.7111978803514154,
"eval_dim_128_cosine_recall@3": 0.4580951052851764,
"eval_dim_128_cosine_recall@5": 0.5392553339841026,
"eval_dim_256_cosine_accuracy@1": 0.34876586250174313,
"eval_dim_256_cosine_accuracy@10": 0.7184493097197043,
"eval_dim_256_cosine_accuracy@3": 0.4705062055501325,
"eval_dim_256_cosine_accuracy@5": 0.5427415981034723,
"eval_dim_256_cosine_map@100": 0.4497903349951724,
"eval_dim_256_cosine_mrr@10": 0.4402565004991461,
"eval_dim_256_cosine_ndcg@10": 0.5046482555536308,
"eval_dim_256_cosine_precision@1": 0.34876586250174313,
"eval_dim_256_cosine_precision@10": 0.07184493097197044,
"eval_dim_256_cosine_precision@3": 0.15683540185004413,
"eval_dim_256_cosine_precision@5": 0.10854831962069447,
"eval_dim_256_cosine_recall@1": 0.34876586250174313,
"eval_dim_256_cosine_recall@10": 0.7184493097197043,
"eval_dim_256_cosine_recall@3": 0.4705062055501325,
"eval_dim_256_cosine_recall@5": 0.5427415981034723,
"eval_dim_512_cosine_accuracy@1": 0.3525310277506624,
"eval_dim_512_cosine_accuracy@10": 0.7208199693208758,
"eval_dim_512_cosine_accuracy@3": 0.47190071119788035,
"eval_dim_512_cosine_accuracy@5": 0.5545948961093292,
"eval_dim_512_cosine_map@100": 0.4537559279114653,
"eval_dim_512_cosine_mrr@10": 0.44413881528997956,
"eval_dim_512_cosine_ndcg@10": 0.5083169852417319,
"eval_dim_512_cosine_precision@1": 0.3525310277506624,
"eval_dim_512_cosine_precision@10": 0.07208199693208758,
"eval_dim_512_cosine_precision@3": 0.1573002370659601,
"eval_dim_512_cosine_precision@5": 0.11091897922186586,
"eval_dim_512_cosine_recall@1": 0.3525310277506624,
"eval_dim_512_cosine_recall@10": 0.7208199693208758,
"eval_dim_512_cosine_recall@3": 0.47190071119788035,
"eval_dim_512_cosine_recall@5": 0.5545948961093292,
"eval_dim_64_cosine_accuracy@1": 0.3289638823037233,
"eval_dim_64_cosine_accuracy@10": 0.6980895272625854,
"eval_dim_64_cosine_accuracy@3": 0.447217961232743,
"eval_dim_64_cosine_accuracy@5": 0.5223818156463533,
"eval_dim_64_cosine_map@100": 0.4300263980717357,
"eval_dim_64_cosine_mrr@10": 0.4197134401568931,
"eval_dim_64_cosine_ndcg@10": 0.48411999159781,
"eval_dim_64_cosine_precision@1": 0.3289638823037233,
"eval_dim_64_cosine_precision@10": 0.06980895272625855,
"eval_dim_64_cosine_precision@3": 0.14907265374424766,
"eval_dim_64_cosine_precision@5": 0.10447636312927068,
"eval_dim_64_cosine_recall@1": 0.3289638823037233,
"eval_dim_64_cosine_recall@10": 0.6980895272625854,
"eval_dim_64_cosine_recall@3": 0.447217961232743,
"eval_dim_64_cosine_recall@5": 0.5223818156463533,
"eval_dim_768_cosine_accuracy@1": 0.35392553339841026,
"eval_dim_768_cosine_accuracy@10": 0.7202621670617766,
"eval_dim_768_cosine_accuracy@3": 0.47078510667968204,
"eval_dim_768_cosine_accuracy@5": 0.5458095105285177,
"eval_dim_768_cosine_map@100": 0.45349669058599684,
"eval_dim_768_cosine_mrr@10": 0.4438007583454529,
"eval_dim_768_cosine_ndcg@10": 0.5077758391371117,
"eval_dim_768_cosine_precision@1": 0.35392553339841026,
"eval_dim_768_cosine_precision@10": 0.07202621670617766,
"eval_dim_768_cosine_precision@3": 0.15692836889322734,
"eval_dim_768_cosine_precision@5": 0.10916190210570352,
"eval_dim_768_cosine_recall@1": 0.35392553339841026,
"eval_dim_768_cosine_recall@10": 0.7202621670617766,
"eval_dim_768_cosine_recall@3": 0.47078510667968204,
"eval_dim_768_cosine_recall@5": 0.5458095105285177,
"eval_loss": 0.1820719689130783,
"eval_runtime": 5286.0245,
"eval_samples_per_second": 1.357,
"eval_sequential_score": 0.48411999159781,
"eval_steps_per_second": 0.014,
"step": 144
},
{
"epoch": 4.0,
"grad_norm": 609946.5,
"learning_rate": 9.328128849810832e-06,
"loss": 0.0828,
"step": 192
},
{
"epoch": 4.0,
"eval_dim_128_cosine_accuracy@1": 0.34876586250174313,
"eval_dim_128_cosine_accuracy@10": 0.7169153535071817,
"eval_dim_128_cosine_accuracy@3": 0.4691116999023846,
"eval_dim_128_cosine_accuracy@5": 0.5466462139171664,
"eval_dim_128_cosine_map@100": 0.44992557552198303,
"eval_dim_128_cosine_mrr@10": 0.4401795813384156,
"eval_dim_128_cosine_ndcg@10": 0.504316835829398,
"eval_dim_128_cosine_precision@1": 0.34876586250174313,
"eval_dim_128_cosine_precision@10": 0.07169153535071818,
"eval_dim_128_cosine_precision@3": 0.15637056663412818,
"eval_dim_128_cosine_precision@5": 0.10932924278343327,
"eval_dim_128_cosine_recall@1": 0.34876586250174313,
"eval_dim_128_cosine_recall@10": 0.7169153535071817,
"eval_dim_128_cosine_recall@3": 0.4691116999023846,
"eval_dim_128_cosine_recall@5": 0.5466462139171664,
"eval_dim_256_cosine_accuracy@1": 0.3514154232324641,
"eval_dim_256_cosine_accuracy@10": 0.7198438153674522,
"eval_dim_256_cosine_accuracy@3": 0.47482917305815087,
"eval_dim_256_cosine_accuracy@5": 0.5479012690001395,
"eval_dim_256_cosine_map@100": 0.45302713856879157,
"eval_dim_256_cosine_mrr@10": 0.44321866291257,
"eval_dim_256_cosine_ndcg@10": 0.5073024414696454,
"eval_dim_256_cosine_precision@1": 0.3514154232324641,
"eval_dim_256_cosine_precision@10": 0.07198438153674523,
"eval_dim_256_cosine_precision@3": 0.15827639101938362,
"eval_dim_256_cosine_precision@5": 0.10958025380002788,
"eval_dim_256_cosine_recall@1": 0.3514154232324641,
"eval_dim_256_cosine_recall@10": 0.7198438153674522,
"eval_dim_256_cosine_recall@3": 0.47482917305815087,
"eval_dim_256_cosine_recall@5": 0.5479012690001395,
"eval_dim_512_cosine_accuracy@1": 0.35629619299958165,
"eval_dim_512_cosine_accuracy@10": 0.7229117277924976,
"eval_dim_512_cosine_accuracy@3": 0.46966950216148373,
"eval_dim_512_cosine_accuracy@5": 0.5479012690001395,
"eval_dim_512_cosine_map@100": 0.4551128486578315,
"eval_dim_512_cosine_mrr@10": 0.4454170567962228,
"eval_dim_512_cosine_ndcg@10": 0.5095844549678528,
"eval_dim_512_cosine_precision@1": 0.35629619299958165,
"eval_dim_512_cosine_precision@10": 0.07229117277924975,
"eval_dim_512_cosine_precision@3": 0.1565565007204946,
"eval_dim_512_cosine_precision@5": 0.10958025380002788,
"eval_dim_512_cosine_recall@1": 0.35629619299958165,
"eval_dim_512_cosine_recall@10": 0.7229117277924976,
"eval_dim_512_cosine_recall@3": 0.46966950216148373,
"eval_dim_512_cosine_recall@5": 0.5479012690001395,
"eval_dim_64_cosine_accuracy@1": 0.33649421280156183,
"eval_dim_64_cosine_accuracy@10": 0.7029702970297029,
"eval_dim_64_cosine_accuracy@3": 0.45432994003625715,
"eval_dim_64_cosine_accuracy@5": 0.5300515967089666,
"eval_dim_64_cosine_map@100": 0.43606205857055896,
"eval_dim_64_cosine_mrr@10": 0.4258440632795675,
"eval_dim_64_cosine_ndcg@10": 0.48996806351717825,
"eval_dim_64_cosine_precision@1": 0.33649421280156183,
"eval_dim_64_cosine_precision@10": 0.0702970297029703,
"eval_dim_64_cosine_precision@3": 0.15144331334541905,
"eval_dim_64_cosine_precision@5": 0.10601031934179334,
"eval_dim_64_cosine_recall@1": 0.33649421280156183,
"eval_dim_64_cosine_recall@10": 0.7029702970297029,
"eval_dim_64_cosine_recall@3": 0.45432994003625715,
"eval_dim_64_cosine_recall@5": 0.5300515967089666,
"eval_dim_768_cosine_accuracy@1": 0.356714544693906,
"eval_dim_768_cosine_accuracy@10": 0.7251429368288942,
"eval_dim_768_cosine_accuracy@3": 0.47315576628085343,
"eval_dim_768_cosine_accuracy@5": 0.5499930274717613,
"eval_dim_768_cosine_map@100": 0.4565653595396862,
"eval_dim_768_cosine_mrr@10": 0.44696689487862346,
"eval_dim_768_cosine_ndcg@10": 0.5113293441302604,
"eval_dim_768_cosine_precision@1": 0.356714544693906,
"eval_dim_768_cosine_precision@10": 0.07251429368288942,
"eval_dim_768_cosine_precision@3": 0.15771858876028447,
"eval_dim_768_cosine_precision@5": 0.10999860549435224,
"eval_dim_768_cosine_recall@1": 0.356714544693906,
"eval_dim_768_cosine_recall@10": 0.7251429368288942,
"eval_dim_768_cosine_recall@3": 0.47315576628085343,
"eval_dim_768_cosine_recall@5": 0.5499930274717613,
"eval_loss": 0.17269685864448547,
"eval_runtime": 5288.939,
"eval_samples_per_second": 1.356,
"eval_sequential_score": 0.48996806351717825,
"eval_steps_per_second": 0.014,
"step": 192
},
{
"epoch": 5.0,
"grad_norm": 373272.25,
"learning_rate": 2.2284601387084617e-06,
"loss": 0.0601,
"step": 240
},
{
"epoch": 5.0,
"eval_dim_128_cosine_accuracy@1": 0.345558499511923,
"eval_dim_128_cosine_accuracy@10": 0.7213777715799748,
"eval_dim_128_cosine_accuracy@3": 0.466880490865988,
"eval_dim_128_cosine_accuracy@5": 0.5456700599637428,
"eval_dim_128_cosine_map@100": 0.44781889706523814,
"eval_dim_128_cosine_mrr@10": 0.4382224037293079,
"eval_dim_128_cosine_ndcg@10": 0.5037796273775794,
"eval_dim_128_cosine_precision@1": 0.345558499511923,
"eval_dim_128_cosine_precision@10": 0.07213777715799749,
"eval_dim_128_cosine_precision@3": 0.15562683028866267,
"eval_dim_128_cosine_precision@5": 0.10913401199274857,
"eval_dim_128_cosine_recall@1": 0.345558499511923,
"eval_dim_128_cosine_recall@10": 0.7213777715799748,
"eval_dim_128_cosine_recall@3": 0.466880490865988,
"eval_dim_128_cosine_recall@5": 0.5456700599637428,
"eval_dim_256_cosine_accuracy@1": 0.3511365221029145,
"eval_dim_256_cosine_accuracy@10": 0.7241667828754706,
"eval_dim_256_cosine_accuracy@3": 0.47399246966950215,
"eval_dim_256_cosine_accuracy@5": 0.5540370938502301,
"eval_dim_256_cosine_map@100": 0.45382807101318545,
"eval_dim_256_cosine_mrr@10": 0.444310748982345,
"eval_dim_256_cosine_ndcg@10": 0.509228248886466,
"eval_dim_256_cosine_precision@1": 0.3511365221029145,
"eval_dim_256_cosine_precision@10": 0.07241667828754707,
"eval_dim_256_cosine_precision@3": 0.15799748988983406,
"eval_dim_256_cosine_precision@5": 0.11080741877004602,
"eval_dim_256_cosine_recall@1": 0.3511365221029145,
"eval_dim_256_cosine_recall@10": 0.7241667828754706,
"eval_dim_256_cosine_recall@3": 0.47399246966950215,
"eval_dim_256_cosine_recall@5": 0.5540370938502301,
"eval_dim_512_cosine_accuracy@1": 0.35545948961093293,
"eval_dim_512_cosine_accuracy@10": 0.7241667828754706,
"eval_dim_512_cosine_accuracy@3": 0.47622367870589877,
"eval_dim_512_cosine_accuracy@5": 0.5550132478036536,
"eval_dim_512_cosine_map@100": 0.4566662947498507,
"eval_dim_512_cosine_mrr@10": 0.4469697724299597,
"eval_dim_512_cosine_ndcg@10": 0.5112339641773941,
"eval_dim_512_cosine_precision@1": 0.35545948961093293,
"eval_dim_512_cosine_precision@10": 0.07241667828754705,
"eval_dim_512_cosine_precision@3": 0.1587412262352996,
"eval_dim_512_cosine_precision@5": 0.11100264956073073,
"eval_dim_512_cosine_recall@1": 0.35545948961093293,
"eval_dim_512_cosine_recall@10": 0.7241667828754706,
"eval_dim_512_cosine_recall@3": 0.47622367870589877,
"eval_dim_512_cosine_recall@5": 0.5550132478036536,
"eval_dim_64_cosine_accuracy@1": 0.3371914656254358,
"eval_dim_64_cosine_accuracy@10": 0.7071538139729466,
"eval_dim_64_cosine_accuracy@3": 0.45725840189652767,
"eval_dim_64_cosine_accuracy@5": 0.5389764328545531,
"eval_dim_64_cosine_map@100": 0.43880820327735404,
"eval_dim_64_cosine_mrr@10": 0.428855420753344,
"eval_dim_64_cosine_ndcg@10": 0.4933751447627624,
"eval_dim_64_cosine_precision@1": 0.3371914656254358,
"eval_dim_64_cosine_precision@10": 0.07071538139729466,
"eval_dim_64_cosine_precision@3": 0.15241946729884256,
"eval_dim_64_cosine_precision@5": 0.10779528657091063,
"eval_dim_64_cosine_recall@1": 0.3371914656254358,
"eval_dim_64_cosine_recall@10": 0.7071538139729466,
"eval_dim_64_cosine_recall@3": 0.45725840189652767,
"eval_dim_64_cosine_recall@5": 0.5389764328545531,
"eval_dim_768_cosine_accuracy@1": 0.35406498396318503,
"eval_dim_768_cosine_accuracy@10": 0.7283502998187142,
"eval_dim_768_cosine_accuracy@3": 0.4713429089387812,
"eval_dim_768_cosine_accuracy@5": 0.552782038767257,
"eval_dim_768_cosine_map@100": 0.45544037871042936,
"eval_dim_768_cosine_mrr@10": 0.4460218406146454,
"eval_dim_768_cosine_ndcg@10": 0.5113413299327996,
"eval_dim_768_cosine_precision@1": 0.35406498396318503,
"eval_dim_768_cosine_precision@10": 0.07283502998187143,
"eval_dim_768_cosine_precision@3": 0.15711430297959372,
"eval_dim_768_cosine_precision@5": 0.1105564077534514,
"eval_dim_768_cosine_recall@1": 0.35406498396318503,
"eval_dim_768_cosine_recall@10": 0.7283502998187142,
"eval_dim_768_cosine_recall@3": 0.4713429089387812,
"eval_dim_768_cosine_recall@5": 0.552782038767257,
"eval_loss": 0.166685089468956,
"eval_runtime": 5294.4091,
"eval_samples_per_second": 1.355,
"eval_sequential_score": 0.4933751447627624,
"eval_steps_per_second": 0.014,
"step": 240
},
{
"epoch": 5.878048780487805,
"grad_norm": 715763.1875,
"learning_rate": 0.0,
"loss": 0.0521,
"step": 282
},
{
"epoch": 5.878048780487805,
"eval_dim_128_cosine_accuracy@1": 0.34667410403012133,
"eval_dim_128_cosine_accuracy@10": 0.7259796402175429,
"eval_dim_128_cosine_accuracy@3": 0.46869334820806025,
"eval_dim_128_cosine_accuracy@5": 0.548877422953563,
"eval_dim_128_cosine_map@100": 0.44958294087462464,
"eval_dim_128_cosine_mrr@10": 0.44026242161439555,
"eval_dim_128_cosine_ndcg@10": 0.5064194393114915,
"eval_dim_128_cosine_precision@1": 0.34667410403012133,
"eval_dim_128_cosine_precision@10": 0.0725979640217543,
"eval_dim_128_cosine_precision@3": 0.15623111606935342,
"eval_dim_128_cosine_precision@5": 0.1097754845907126,
"eval_dim_128_cosine_recall@1": 0.34667410403012133,
"eval_dim_128_cosine_recall@10": 0.7259796402175429,
"eval_dim_128_cosine_recall@3": 0.46869334820806025,
"eval_dim_128_cosine_recall@5": 0.548877422953563,
"eval_dim_256_cosine_accuracy@1": 0.35099707153813975,
"eval_dim_256_cosine_accuracy@10": 0.719286013108353,
"eval_dim_256_cosine_accuracy@3": 0.47455027192860133,
"eval_dim_256_cosine_accuracy@5": 0.5502719286013108,
"eval_dim_256_cosine_map@100": 0.45309491401564994,
"eval_dim_256_cosine_mrr@10": 0.4432182202123648,
"eval_dim_256_cosine_ndcg@10": 0.5072173461870104,
"eval_dim_256_cosine_precision@1": 0.35099707153813975,
"eval_dim_256_cosine_precision@10": 0.0719286013108353,
"eval_dim_256_cosine_precision@3": 0.15818342397620047,
"eval_dim_256_cosine_precision@5": 0.11005438572026217,
"eval_dim_256_cosine_recall@1": 0.35099707153813975,
"eval_dim_256_cosine_recall@10": 0.719286013108353,
"eval_dim_256_cosine_recall@3": 0.47455027192860133,
"eval_dim_256_cosine_recall@5": 0.5502719286013108,
"eval_dim_512_cosine_accuracy@1": 0.3569934458234556,
"eval_dim_512_cosine_accuracy@10": 0.7248640356993445,
"eval_dim_512_cosine_accuracy@3": 0.4744108213638265,
"eval_dim_512_cosine_accuracy@5": 0.5523636870729326,
"eval_dim_512_cosine_map@100": 0.45691118758008836,
"eval_dim_512_cosine_mrr@10": 0.4473125330641728,
"eval_dim_512_cosine_ndcg@10": 0.5115413503217677,
"eval_dim_512_cosine_precision@1": 0.3569934458234556,
"eval_dim_512_cosine_precision@10": 0.07248640356993445,
"eval_dim_512_cosine_precision@3": 0.15813694045460885,
"eval_dim_512_cosine_precision@5": 0.11047273741458653,
"eval_dim_512_cosine_recall@1": 0.3569934458234556,
"eval_dim_512_cosine_recall@10": 0.7248640356993445,
"eval_dim_512_cosine_recall@3": 0.4744108213638265,
"eval_dim_512_cosine_recall@5": 0.5523636870729326,
"eval_dim_64_cosine_accuracy@1": 0.3380281690140845,
"eval_dim_64_cosine_accuracy@10": 0.7046437038070004,
"eval_dim_64_cosine_accuracy@3": 0.4548877422953563,
"eval_dim_64_cosine_accuracy@5": 0.5322828057453632,
"eval_dim_64_cosine_map@100": 0.4382982729365051,
"eval_dim_64_cosine_mrr@10": 0.4281275109402298,
"eval_dim_64_cosine_ndcg@10": 0.49214355622918665,
"eval_dim_64_cosine_precision@1": 0.3380281690140845,
"eval_dim_64_cosine_precision@10": 0.07046437038070004,
"eval_dim_64_cosine_precision@3": 0.1516292474317854,
"eval_dim_64_cosine_precision@5": 0.10645656114907265,
"eval_dim_64_cosine_recall@1": 0.3380281690140845,
"eval_dim_64_cosine_recall@10": 0.7046437038070004,
"eval_dim_64_cosine_recall@3": 0.4548877422953563,
"eval_dim_64_cosine_recall@5": 0.5322828057453632,
"eval_dim_768_cosine_accuracy@1": 0.35490168735183375,
"eval_dim_768_cosine_accuracy@10": 0.7261190907823176,
"eval_dim_768_cosine_accuracy@3": 0.4723190628922047,
"eval_dim_768_cosine_accuracy@5": 0.5504113791660856,
"eval_dim_768_cosine_map@100": 0.455135537492312,
"eval_dim_768_cosine_mrr@10": 0.44549231583118165,
"eval_dim_768_cosine_ndcg@10": 0.5104063813142831,
"eval_dim_768_cosine_precision@1": 0.35490168735183375,
"eval_dim_768_cosine_precision@10": 0.07261190907823176,
"eval_dim_768_cosine_precision@3": 0.1574396876307349,
"eval_dim_768_cosine_precision@5": 0.11008227583321714,
"eval_dim_768_cosine_recall@1": 0.35490168735183375,
"eval_dim_768_cosine_recall@10": 0.7261190907823176,
"eval_dim_768_cosine_recall@3": 0.4723190628922047,
"eval_dim_768_cosine_recall@5": 0.5504113791660856,
"eval_loss": 0.16643136739730835,
"eval_runtime": 5293.6409,
"eval_samples_per_second": 1.355,
"eval_sequential_score": 0.49214355622918665,
"eval_steps_per_second": 0.014,
"step": 282
}
],
"logging_steps": 500,
"max_steps": 282,
"num_input_tokens_seen": 0,
"num_train_epochs": 6,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 1,
"early_stopping_threshold": 0.001
},
"attributes": {
"early_stopping_patience_counter": 1
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 100,
"trial_name": null,
"trial_params": null
}