|
{ |
|
"best_metric": 0.16643136739730835, |
|
"best_model_checkpoint": "bkai-fine-tuned-legal/checkpoint-282", |
|
"epoch": 5.878048780487805, |
|
"eval_steps": 500, |
|
"global_step": 282, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 3041986.25, |
|
"learning_rate": 2.9967614628878062e-05, |
|
"loss": 1.1542, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_dim_128_cosine_accuracy@1": 0.19871705480407195, |
|
"eval_dim_128_cosine_accuracy@10": 0.6681076558360062, |
|
"eval_dim_128_cosine_accuracy@3": 0.3995258680797657, |
|
"eval_dim_128_cosine_accuracy@5": 0.4922604936549993, |
|
"eval_dim_128_cosine_map@100": 0.33912660774009473, |
|
"eval_dim_128_cosine_mrr@10": 0.32818611337994835, |
|
"eval_dim_128_cosine_ndcg@10": 0.40810554118165804, |
|
"eval_dim_128_cosine_precision@1": 0.19871705480407195, |
|
"eval_dim_128_cosine_precision@10": 0.06681076558360062, |
|
"eval_dim_128_cosine_precision@3": 0.1331752893599219, |
|
"eval_dim_128_cosine_precision@5": 0.09845209873099986, |
|
"eval_dim_128_cosine_recall@1": 0.19871705480407195, |
|
"eval_dim_128_cosine_recall@10": 0.6681076558360062, |
|
"eval_dim_128_cosine_recall@3": 0.3995258680797657, |
|
"eval_dim_128_cosine_recall@5": 0.4922604936549993, |
|
"eval_dim_256_cosine_accuracy@1": 0.19983265932227026, |
|
"eval_dim_256_cosine_accuracy@10": 0.6777297448054664, |
|
"eval_dim_256_cosine_accuracy@3": 0.3998047692093153, |
|
"eval_dim_256_cosine_accuracy@5": 0.4954678566448194, |
|
"eval_dim_256_cosine_map@100": 0.34191237247567885, |
|
"eval_dim_256_cosine_mrr@10": 0.33120438804443747, |
|
"eval_dim_256_cosine_ndcg@10": 0.4125662992991588, |
|
"eval_dim_256_cosine_precision@1": 0.19983265932227026, |
|
"eval_dim_256_cosine_precision@10": 0.06777297448054664, |
|
"eval_dim_256_cosine_precision@3": 0.13326825640310508, |
|
"eval_dim_256_cosine_precision@5": 0.09909357132896388, |
|
"eval_dim_256_cosine_recall@1": 0.19983265932227026, |
|
"eval_dim_256_cosine_recall@10": 0.6777297448054664, |
|
"eval_dim_256_cosine_recall@3": 0.3998047692093153, |
|
"eval_dim_256_cosine_recall@5": 0.4954678566448194, |
|
"eval_dim_512_cosine_accuracy@1": 0.20945474829173058, |
|
"eval_dim_512_cosine_accuracy@10": 0.6849811741737554, |
|
"eval_dim_512_cosine_accuracy@3": 0.41040301213219915, |
|
"eval_dim_512_cosine_accuracy@5": 0.5059266490029285, |
|
"eval_dim_512_cosine_map@100": 0.3513161520991861, |
|
"eval_dim_512_cosine_mrr@10": 0.340864051193851, |
|
"eval_dim_512_cosine_ndcg@10": 0.42175585614805716, |
|
"eval_dim_512_cosine_precision@1": 0.20945474829173058, |
|
"eval_dim_512_cosine_precision@10": 0.06849811741737553, |
|
"eval_dim_512_cosine_precision@3": 0.13680100404406637, |
|
"eval_dim_512_cosine_precision@5": 0.1011853298005857, |
|
"eval_dim_512_cosine_recall@1": 0.20945474829173058, |
|
"eval_dim_512_cosine_recall@10": 0.6849811741737554, |
|
"eval_dim_512_cosine_recall@3": 0.41040301213219915, |
|
"eval_dim_512_cosine_recall@5": 0.5059266490029285, |
|
"eval_dim_64_cosine_accuracy@1": 0.18923441639938643, |
|
"eval_dim_64_cosine_accuracy@10": 0.6431460047413192, |
|
"eval_dim_64_cosine_accuracy@3": 0.38056059127039465, |
|
"eval_dim_64_cosine_accuracy@5": 0.4667410403012132, |
|
"eval_dim_64_cosine_map@100": 0.32516177346707625, |
|
"eval_dim_64_cosine_mrr@10": 0.3137617785923441, |
|
"eval_dim_64_cosine_ndcg@10": 0.39102781421972704, |
|
"eval_dim_64_cosine_precision@1": 0.18923441639938643, |
|
"eval_dim_64_cosine_precision@10": 0.06431460047413191, |
|
"eval_dim_64_cosine_precision@3": 0.12685353042346487, |
|
"eval_dim_64_cosine_precision@5": 0.09334820806024266, |
|
"eval_dim_64_cosine_recall@1": 0.18923441639938643, |
|
"eval_dim_64_cosine_recall@10": 0.6431460047413192, |
|
"eval_dim_64_cosine_recall@3": 0.38056059127039465, |
|
"eval_dim_64_cosine_recall@5": 0.4667410403012132, |
|
"eval_dim_768_cosine_accuracy@1": 0.2069446381257844, |
|
"eval_dim_768_cosine_accuracy@10": 0.6877701854692512, |
|
"eval_dim_768_cosine_accuracy@3": 0.41110026495607305, |
|
"eval_dim_768_cosine_accuracy@5": 0.5078789569097755, |
|
"eval_dim_768_cosine_map@100": 0.35016286957488246, |
|
"eval_dim_768_cosine_mrr@10": 0.33975193293977246, |
|
"eval_dim_768_cosine_ndcg@10": 0.42158855710438475, |
|
"eval_dim_768_cosine_precision@1": 0.2069446381257844, |
|
"eval_dim_768_cosine_precision@10": 0.06877701854692511, |
|
"eval_dim_768_cosine_precision@3": 0.13703342165202437, |
|
"eval_dim_768_cosine_precision@5": 0.1015757913819551, |
|
"eval_dim_768_cosine_recall@1": 0.2069446381257844, |
|
"eval_dim_768_cosine_recall@10": 0.6877701854692512, |
|
"eval_dim_768_cosine_recall@3": 0.41110026495607305, |
|
"eval_dim_768_cosine_recall@5": 0.5078789569097755, |
|
"eval_loss": 0.35814541578292847, |
|
"eval_runtime": 5308.0606, |
|
"eval_samples_per_second": 1.351, |
|
"eval_sequential_score": 0.39102781421972704, |
|
"eval_steps_per_second": 0.014, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1227518.25, |
|
"learning_rate": 2.65047365119413e-05, |
|
"loss": 0.3058, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_dim_128_cosine_accuracy@1": 0.319341793334263, |
|
"eval_dim_128_cosine_accuracy@10": 0.7118951331752894, |
|
"eval_dim_128_cosine_accuracy@3": 0.45670059963742854, |
|
"eval_dim_128_cosine_accuracy@5": 0.5373030260772557, |
|
"eval_dim_128_cosine_map@100": 0.43025589198069303, |
|
"eval_dim_128_cosine_mrr@10": 0.4206424465384167, |
|
"eval_dim_128_cosine_ndcg@10": 0.48839839347709046, |
|
"eval_dim_128_cosine_precision@1": 0.319341793334263, |
|
"eval_dim_128_cosine_precision@10": 0.07118951331752894, |
|
"eval_dim_128_cosine_precision@3": 0.15223353321247615, |
|
"eval_dim_128_cosine_precision@5": 0.10746060521545113, |
|
"eval_dim_128_cosine_recall@1": 0.319341793334263, |
|
"eval_dim_128_cosine_recall@10": 0.7118951331752894, |
|
"eval_dim_128_cosine_recall@3": 0.45670059963742854, |
|
"eval_dim_128_cosine_recall@5": 0.5373030260772557, |
|
"eval_dim_256_cosine_accuracy@1": 0.3284060800446242, |
|
"eval_dim_256_cosine_accuracy@10": 0.709524473574118, |
|
"eval_dim_256_cosine_accuracy@3": 0.4618602705340957, |
|
"eval_dim_256_cosine_accuracy@5": 0.5356296192999581, |
|
"eval_dim_256_cosine_map@100": 0.4364935437376769, |
|
"eval_dim_256_cosine_mrr@10": 0.42624382156525586, |
|
"eval_dim_256_cosine_ndcg@10": 0.49204715409513783, |
|
"eval_dim_256_cosine_precision@1": 0.3284060800446242, |
|
"eval_dim_256_cosine_precision@10": 0.07095244735741181, |
|
"eval_dim_256_cosine_precision@3": 0.15395342351136523, |
|
"eval_dim_256_cosine_precision@5": 0.10712592385999165, |
|
"eval_dim_256_cosine_recall@1": 0.3284060800446242, |
|
"eval_dim_256_cosine_recall@10": 0.709524473574118, |
|
"eval_dim_256_cosine_recall@3": 0.4618602705340957, |
|
"eval_dim_256_cosine_recall@5": 0.5356296192999581, |
|
"eval_dim_512_cosine_accuracy@1": 0.33663366336633666, |
|
"eval_dim_512_cosine_accuracy@10": 0.7125923859991633, |
|
"eval_dim_512_cosine_accuracy@3": 0.46841444707851065, |
|
"eval_dim_512_cosine_accuracy@5": 0.5441361037512202, |
|
"eval_dim_512_cosine_map@100": 0.4433337740824084, |
|
"eval_dim_512_cosine_mrr@10": 0.43360332512124483, |
|
"eval_dim_512_cosine_ndcg@10": 0.4984772586608768, |
|
"eval_dim_512_cosine_precision@1": 0.33663366336633666, |
|
"eval_dim_512_cosine_precision@10": 0.07125923859991633, |
|
"eval_dim_512_cosine_precision@3": 0.15613814902617024, |
|
"eval_dim_512_cosine_precision@5": 0.10882722075024404, |
|
"eval_dim_512_cosine_recall@1": 0.33663366336633666, |
|
"eval_dim_512_cosine_recall@10": 0.7125923859991633, |
|
"eval_dim_512_cosine_recall@3": 0.46841444707851065, |
|
"eval_dim_512_cosine_recall@5": 0.5441361037512202, |
|
"eval_dim_64_cosine_accuracy@1": 0.3026077255612885, |
|
"eval_dim_64_cosine_accuracy@10": 0.689861943940873, |
|
"eval_dim_64_cosine_accuracy@3": 0.4437316971133733, |
|
"eval_dim_64_cosine_accuracy@5": 0.519313903221308, |
|
"eval_dim_64_cosine_map@100": 0.4140292225757397, |
|
"eval_dim_64_cosine_mrr@10": 0.4037352829850398, |
|
"eval_dim_64_cosine_ndcg@10": 0.47036063500166436, |
|
"eval_dim_64_cosine_precision@1": 0.3026077255612885, |
|
"eval_dim_64_cosine_precision@10": 0.0689861943940873, |
|
"eval_dim_64_cosine_precision@3": 0.14791056570445774, |
|
"eval_dim_64_cosine_precision@5": 0.10386278064426162, |
|
"eval_dim_64_cosine_recall@1": 0.3026077255612885, |
|
"eval_dim_64_cosine_recall@10": 0.689861943940873, |
|
"eval_dim_64_cosine_recall@3": 0.4437316971133733, |
|
"eval_dim_64_cosine_recall@5": 0.519313903221308, |
|
"eval_dim_768_cosine_accuracy@1": 0.3332868498117417, |
|
"eval_dim_768_cosine_accuracy@10": 0.7166364523776322, |
|
"eval_dim_768_cosine_accuracy@3": 0.46841444707851065, |
|
"eval_dim_768_cosine_accuracy@5": 0.546227862222842, |
|
"eval_dim_768_cosine_map@100": 0.44212169088004494, |
|
"eval_dim_768_cosine_mrr@10": 0.4324117975177812, |
|
"eval_dim_768_cosine_ndcg@10": 0.498508349299699, |
|
"eval_dim_768_cosine_precision@1": 0.3332868498117417, |
|
"eval_dim_768_cosine_precision@10": 0.07166364523776322, |
|
"eval_dim_768_cosine_precision@3": 0.1561381490261702, |
|
"eval_dim_768_cosine_precision@5": 0.1092455724445684, |
|
"eval_dim_768_cosine_recall@1": 0.3332868498117417, |
|
"eval_dim_768_cosine_recall@10": 0.7166364523776322, |
|
"eval_dim_768_cosine_recall@3": 0.46841444707851065, |
|
"eval_dim_768_cosine_recall@5": 0.546227862222842, |
|
"eval_loss": 0.2100292444229126, |
|
"eval_runtime": 5303.3966, |
|
"eval_samples_per_second": 1.352, |
|
"eval_sequential_score": 0.47036063500166436, |
|
"eval_steps_per_second": 0.014, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 751449.875, |
|
"learning_rate": 1.8611820248535433e-05, |
|
"loss": 0.1395, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_dim_128_cosine_accuracy@1": 0.3420722353925533, |
|
"eval_dim_128_cosine_accuracy@10": 0.7111978803514154, |
|
"eval_dim_128_cosine_accuracy@3": 0.4580951052851764, |
|
"eval_dim_128_cosine_accuracy@5": 0.5392553339841026, |
|
"eval_dim_128_cosine_map@100": 0.44322012540075556, |
|
"eval_dim_128_cosine_mrr@10": 0.43320030192154113, |
|
"eval_dim_128_cosine_ndcg@10": 0.49761764615839976, |
|
"eval_dim_128_cosine_precision@1": 0.3420722353925533, |
|
"eval_dim_128_cosine_precision@10": 0.07111978803514155, |
|
"eval_dim_128_cosine_precision@3": 0.15269836842839213, |
|
"eval_dim_128_cosine_precision@5": 0.10785106679682054, |
|
"eval_dim_128_cosine_recall@1": 0.3420722353925533, |
|
"eval_dim_128_cosine_recall@10": 0.7111978803514154, |
|
"eval_dim_128_cosine_recall@3": 0.4580951052851764, |
|
"eval_dim_128_cosine_recall@5": 0.5392553339841026, |
|
"eval_dim_256_cosine_accuracy@1": 0.34876586250174313, |
|
"eval_dim_256_cosine_accuracy@10": 0.7184493097197043, |
|
"eval_dim_256_cosine_accuracy@3": 0.4705062055501325, |
|
"eval_dim_256_cosine_accuracy@5": 0.5427415981034723, |
|
"eval_dim_256_cosine_map@100": 0.4497903349951724, |
|
"eval_dim_256_cosine_mrr@10": 0.4402565004991461, |
|
"eval_dim_256_cosine_ndcg@10": 0.5046482555536308, |
|
"eval_dim_256_cosine_precision@1": 0.34876586250174313, |
|
"eval_dim_256_cosine_precision@10": 0.07184493097197044, |
|
"eval_dim_256_cosine_precision@3": 0.15683540185004413, |
|
"eval_dim_256_cosine_precision@5": 0.10854831962069447, |
|
"eval_dim_256_cosine_recall@1": 0.34876586250174313, |
|
"eval_dim_256_cosine_recall@10": 0.7184493097197043, |
|
"eval_dim_256_cosine_recall@3": 0.4705062055501325, |
|
"eval_dim_256_cosine_recall@5": 0.5427415981034723, |
|
"eval_dim_512_cosine_accuracy@1": 0.3525310277506624, |
|
"eval_dim_512_cosine_accuracy@10": 0.7208199693208758, |
|
"eval_dim_512_cosine_accuracy@3": 0.47190071119788035, |
|
"eval_dim_512_cosine_accuracy@5": 0.5545948961093292, |
|
"eval_dim_512_cosine_map@100": 0.4537559279114653, |
|
"eval_dim_512_cosine_mrr@10": 0.44413881528997956, |
|
"eval_dim_512_cosine_ndcg@10": 0.5083169852417319, |
|
"eval_dim_512_cosine_precision@1": 0.3525310277506624, |
|
"eval_dim_512_cosine_precision@10": 0.07208199693208758, |
|
"eval_dim_512_cosine_precision@3": 0.1573002370659601, |
|
"eval_dim_512_cosine_precision@5": 0.11091897922186586, |
|
"eval_dim_512_cosine_recall@1": 0.3525310277506624, |
|
"eval_dim_512_cosine_recall@10": 0.7208199693208758, |
|
"eval_dim_512_cosine_recall@3": 0.47190071119788035, |
|
"eval_dim_512_cosine_recall@5": 0.5545948961093292, |
|
"eval_dim_64_cosine_accuracy@1": 0.3289638823037233, |
|
"eval_dim_64_cosine_accuracy@10": 0.6980895272625854, |
|
"eval_dim_64_cosine_accuracy@3": 0.447217961232743, |
|
"eval_dim_64_cosine_accuracy@5": 0.5223818156463533, |
|
"eval_dim_64_cosine_map@100": 0.4300263980717357, |
|
"eval_dim_64_cosine_mrr@10": 0.4197134401568931, |
|
"eval_dim_64_cosine_ndcg@10": 0.48411999159781, |
|
"eval_dim_64_cosine_precision@1": 0.3289638823037233, |
|
"eval_dim_64_cosine_precision@10": 0.06980895272625855, |
|
"eval_dim_64_cosine_precision@3": 0.14907265374424766, |
|
"eval_dim_64_cosine_precision@5": 0.10447636312927068, |
|
"eval_dim_64_cosine_recall@1": 0.3289638823037233, |
|
"eval_dim_64_cosine_recall@10": 0.6980895272625854, |
|
"eval_dim_64_cosine_recall@3": 0.447217961232743, |
|
"eval_dim_64_cosine_recall@5": 0.5223818156463533, |
|
"eval_dim_768_cosine_accuracy@1": 0.35392553339841026, |
|
"eval_dim_768_cosine_accuracy@10": 0.7202621670617766, |
|
"eval_dim_768_cosine_accuracy@3": 0.47078510667968204, |
|
"eval_dim_768_cosine_accuracy@5": 0.5458095105285177, |
|
"eval_dim_768_cosine_map@100": 0.45349669058599684, |
|
"eval_dim_768_cosine_mrr@10": 0.4438007583454529, |
|
"eval_dim_768_cosine_ndcg@10": 0.5077758391371117, |
|
"eval_dim_768_cosine_precision@1": 0.35392553339841026, |
|
"eval_dim_768_cosine_precision@10": 0.07202621670617766, |
|
"eval_dim_768_cosine_precision@3": 0.15692836889322734, |
|
"eval_dim_768_cosine_precision@5": 0.10916190210570352, |
|
"eval_dim_768_cosine_recall@1": 0.35392553339841026, |
|
"eval_dim_768_cosine_recall@10": 0.7202621670617766, |
|
"eval_dim_768_cosine_recall@3": 0.47078510667968204, |
|
"eval_dim_768_cosine_recall@5": 0.5458095105285177, |
|
"eval_loss": 0.1820719689130783, |
|
"eval_runtime": 5286.0245, |
|
"eval_samples_per_second": 1.357, |
|
"eval_sequential_score": 0.48411999159781, |
|
"eval_steps_per_second": 0.014, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 609946.5, |
|
"learning_rate": 9.328128849810832e-06, |
|
"loss": 0.0828, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_dim_128_cosine_accuracy@1": 0.34876586250174313, |
|
"eval_dim_128_cosine_accuracy@10": 0.7169153535071817, |
|
"eval_dim_128_cosine_accuracy@3": 0.4691116999023846, |
|
"eval_dim_128_cosine_accuracy@5": 0.5466462139171664, |
|
"eval_dim_128_cosine_map@100": 0.44992557552198303, |
|
"eval_dim_128_cosine_mrr@10": 0.4401795813384156, |
|
"eval_dim_128_cosine_ndcg@10": 0.504316835829398, |
|
"eval_dim_128_cosine_precision@1": 0.34876586250174313, |
|
"eval_dim_128_cosine_precision@10": 0.07169153535071818, |
|
"eval_dim_128_cosine_precision@3": 0.15637056663412818, |
|
"eval_dim_128_cosine_precision@5": 0.10932924278343327, |
|
"eval_dim_128_cosine_recall@1": 0.34876586250174313, |
|
"eval_dim_128_cosine_recall@10": 0.7169153535071817, |
|
"eval_dim_128_cosine_recall@3": 0.4691116999023846, |
|
"eval_dim_128_cosine_recall@5": 0.5466462139171664, |
|
"eval_dim_256_cosine_accuracy@1": 0.3514154232324641, |
|
"eval_dim_256_cosine_accuracy@10": 0.7198438153674522, |
|
"eval_dim_256_cosine_accuracy@3": 0.47482917305815087, |
|
"eval_dim_256_cosine_accuracy@5": 0.5479012690001395, |
|
"eval_dim_256_cosine_map@100": 0.45302713856879157, |
|
"eval_dim_256_cosine_mrr@10": 0.44321866291257, |
|
"eval_dim_256_cosine_ndcg@10": 0.5073024414696454, |
|
"eval_dim_256_cosine_precision@1": 0.3514154232324641, |
|
"eval_dim_256_cosine_precision@10": 0.07198438153674523, |
|
"eval_dim_256_cosine_precision@3": 0.15827639101938362, |
|
"eval_dim_256_cosine_precision@5": 0.10958025380002788, |
|
"eval_dim_256_cosine_recall@1": 0.3514154232324641, |
|
"eval_dim_256_cosine_recall@10": 0.7198438153674522, |
|
"eval_dim_256_cosine_recall@3": 0.47482917305815087, |
|
"eval_dim_256_cosine_recall@5": 0.5479012690001395, |
|
"eval_dim_512_cosine_accuracy@1": 0.35629619299958165, |
|
"eval_dim_512_cosine_accuracy@10": 0.7229117277924976, |
|
"eval_dim_512_cosine_accuracy@3": 0.46966950216148373, |
|
"eval_dim_512_cosine_accuracy@5": 0.5479012690001395, |
|
"eval_dim_512_cosine_map@100": 0.4551128486578315, |
|
"eval_dim_512_cosine_mrr@10": 0.4454170567962228, |
|
"eval_dim_512_cosine_ndcg@10": 0.5095844549678528, |
|
"eval_dim_512_cosine_precision@1": 0.35629619299958165, |
|
"eval_dim_512_cosine_precision@10": 0.07229117277924975, |
|
"eval_dim_512_cosine_precision@3": 0.1565565007204946, |
|
"eval_dim_512_cosine_precision@5": 0.10958025380002788, |
|
"eval_dim_512_cosine_recall@1": 0.35629619299958165, |
|
"eval_dim_512_cosine_recall@10": 0.7229117277924976, |
|
"eval_dim_512_cosine_recall@3": 0.46966950216148373, |
|
"eval_dim_512_cosine_recall@5": 0.5479012690001395, |
|
"eval_dim_64_cosine_accuracy@1": 0.33649421280156183, |
|
"eval_dim_64_cosine_accuracy@10": 0.7029702970297029, |
|
"eval_dim_64_cosine_accuracy@3": 0.45432994003625715, |
|
"eval_dim_64_cosine_accuracy@5": 0.5300515967089666, |
|
"eval_dim_64_cosine_map@100": 0.43606205857055896, |
|
"eval_dim_64_cosine_mrr@10": 0.4258440632795675, |
|
"eval_dim_64_cosine_ndcg@10": 0.48996806351717825, |
|
"eval_dim_64_cosine_precision@1": 0.33649421280156183, |
|
"eval_dim_64_cosine_precision@10": 0.0702970297029703, |
|
"eval_dim_64_cosine_precision@3": 0.15144331334541905, |
|
"eval_dim_64_cosine_precision@5": 0.10601031934179334, |
|
"eval_dim_64_cosine_recall@1": 0.33649421280156183, |
|
"eval_dim_64_cosine_recall@10": 0.7029702970297029, |
|
"eval_dim_64_cosine_recall@3": 0.45432994003625715, |
|
"eval_dim_64_cosine_recall@5": 0.5300515967089666, |
|
"eval_dim_768_cosine_accuracy@1": 0.356714544693906, |
|
"eval_dim_768_cosine_accuracy@10": 0.7251429368288942, |
|
"eval_dim_768_cosine_accuracy@3": 0.47315576628085343, |
|
"eval_dim_768_cosine_accuracy@5": 0.5499930274717613, |
|
"eval_dim_768_cosine_map@100": 0.4565653595396862, |
|
"eval_dim_768_cosine_mrr@10": 0.44696689487862346, |
|
"eval_dim_768_cosine_ndcg@10": 0.5113293441302604, |
|
"eval_dim_768_cosine_precision@1": 0.356714544693906, |
|
"eval_dim_768_cosine_precision@10": 0.07251429368288942, |
|
"eval_dim_768_cosine_precision@3": 0.15771858876028447, |
|
"eval_dim_768_cosine_precision@5": 0.10999860549435224, |
|
"eval_dim_768_cosine_recall@1": 0.356714544693906, |
|
"eval_dim_768_cosine_recall@10": 0.7251429368288942, |
|
"eval_dim_768_cosine_recall@3": 0.47315576628085343, |
|
"eval_dim_768_cosine_recall@5": 0.5499930274717613, |
|
"eval_loss": 0.17269685864448547, |
|
"eval_runtime": 5288.939, |
|
"eval_samples_per_second": 1.356, |
|
"eval_sequential_score": 0.48996806351717825, |
|
"eval_steps_per_second": 0.014, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 373272.25, |
|
"learning_rate": 2.2284601387084617e-06, |
|
"loss": 0.0601, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_dim_128_cosine_accuracy@1": 0.345558499511923, |
|
"eval_dim_128_cosine_accuracy@10": 0.7213777715799748, |
|
"eval_dim_128_cosine_accuracy@3": 0.466880490865988, |
|
"eval_dim_128_cosine_accuracy@5": 0.5456700599637428, |
|
"eval_dim_128_cosine_map@100": 0.44781889706523814, |
|
"eval_dim_128_cosine_mrr@10": 0.4382224037293079, |
|
"eval_dim_128_cosine_ndcg@10": 0.5037796273775794, |
|
"eval_dim_128_cosine_precision@1": 0.345558499511923, |
|
"eval_dim_128_cosine_precision@10": 0.07213777715799749, |
|
"eval_dim_128_cosine_precision@3": 0.15562683028866267, |
|
"eval_dim_128_cosine_precision@5": 0.10913401199274857, |
|
"eval_dim_128_cosine_recall@1": 0.345558499511923, |
|
"eval_dim_128_cosine_recall@10": 0.7213777715799748, |
|
"eval_dim_128_cosine_recall@3": 0.466880490865988, |
|
"eval_dim_128_cosine_recall@5": 0.5456700599637428, |
|
"eval_dim_256_cosine_accuracy@1": 0.3511365221029145, |
|
"eval_dim_256_cosine_accuracy@10": 0.7241667828754706, |
|
"eval_dim_256_cosine_accuracy@3": 0.47399246966950215, |
|
"eval_dim_256_cosine_accuracy@5": 0.5540370938502301, |
|
"eval_dim_256_cosine_map@100": 0.45382807101318545, |
|
"eval_dim_256_cosine_mrr@10": 0.444310748982345, |
|
"eval_dim_256_cosine_ndcg@10": 0.509228248886466, |
|
"eval_dim_256_cosine_precision@1": 0.3511365221029145, |
|
"eval_dim_256_cosine_precision@10": 0.07241667828754707, |
|
"eval_dim_256_cosine_precision@3": 0.15799748988983406, |
|
"eval_dim_256_cosine_precision@5": 0.11080741877004602, |
|
"eval_dim_256_cosine_recall@1": 0.3511365221029145, |
|
"eval_dim_256_cosine_recall@10": 0.7241667828754706, |
|
"eval_dim_256_cosine_recall@3": 0.47399246966950215, |
|
"eval_dim_256_cosine_recall@5": 0.5540370938502301, |
|
"eval_dim_512_cosine_accuracy@1": 0.35545948961093293, |
|
"eval_dim_512_cosine_accuracy@10": 0.7241667828754706, |
|
"eval_dim_512_cosine_accuracy@3": 0.47622367870589877, |
|
"eval_dim_512_cosine_accuracy@5": 0.5550132478036536, |
|
"eval_dim_512_cosine_map@100": 0.4566662947498507, |
|
"eval_dim_512_cosine_mrr@10": 0.4469697724299597, |
|
"eval_dim_512_cosine_ndcg@10": 0.5112339641773941, |
|
"eval_dim_512_cosine_precision@1": 0.35545948961093293, |
|
"eval_dim_512_cosine_precision@10": 0.07241667828754705, |
|
"eval_dim_512_cosine_precision@3": 0.1587412262352996, |
|
"eval_dim_512_cosine_precision@5": 0.11100264956073073, |
|
"eval_dim_512_cosine_recall@1": 0.35545948961093293, |
|
"eval_dim_512_cosine_recall@10": 0.7241667828754706, |
|
"eval_dim_512_cosine_recall@3": 0.47622367870589877, |
|
"eval_dim_512_cosine_recall@5": 0.5550132478036536, |
|
"eval_dim_64_cosine_accuracy@1": 0.3371914656254358, |
|
"eval_dim_64_cosine_accuracy@10": 0.7071538139729466, |
|
"eval_dim_64_cosine_accuracy@3": 0.45725840189652767, |
|
"eval_dim_64_cosine_accuracy@5": 0.5389764328545531, |
|
"eval_dim_64_cosine_map@100": 0.43880820327735404, |
|
"eval_dim_64_cosine_mrr@10": 0.428855420753344, |
|
"eval_dim_64_cosine_ndcg@10": 0.4933751447627624, |
|
"eval_dim_64_cosine_precision@1": 0.3371914656254358, |
|
"eval_dim_64_cosine_precision@10": 0.07071538139729466, |
|
"eval_dim_64_cosine_precision@3": 0.15241946729884256, |
|
"eval_dim_64_cosine_precision@5": 0.10779528657091063, |
|
"eval_dim_64_cosine_recall@1": 0.3371914656254358, |
|
"eval_dim_64_cosine_recall@10": 0.7071538139729466, |
|
"eval_dim_64_cosine_recall@3": 0.45725840189652767, |
|
"eval_dim_64_cosine_recall@5": 0.5389764328545531, |
|
"eval_dim_768_cosine_accuracy@1": 0.35406498396318503, |
|
"eval_dim_768_cosine_accuracy@10": 0.7283502998187142, |
|
"eval_dim_768_cosine_accuracy@3": 0.4713429089387812, |
|
"eval_dim_768_cosine_accuracy@5": 0.552782038767257, |
|
"eval_dim_768_cosine_map@100": 0.45544037871042936, |
|
"eval_dim_768_cosine_mrr@10": 0.4460218406146454, |
|
"eval_dim_768_cosine_ndcg@10": 0.5113413299327996, |
|
"eval_dim_768_cosine_precision@1": 0.35406498396318503, |
|
"eval_dim_768_cosine_precision@10": 0.07283502998187143, |
|
"eval_dim_768_cosine_precision@3": 0.15711430297959372, |
|
"eval_dim_768_cosine_precision@5": 0.1105564077534514, |
|
"eval_dim_768_cosine_recall@1": 0.35406498396318503, |
|
"eval_dim_768_cosine_recall@10": 0.7283502998187142, |
|
"eval_dim_768_cosine_recall@3": 0.4713429089387812, |
|
"eval_dim_768_cosine_recall@5": 0.552782038767257, |
|
"eval_loss": 0.166685089468956, |
|
"eval_runtime": 5294.4091, |
|
"eval_samples_per_second": 1.355, |
|
"eval_sequential_score": 0.4933751447627624, |
|
"eval_steps_per_second": 0.014, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 5.878048780487805, |
|
"grad_norm": 715763.1875, |
|
"learning_rate": 0.0, |
|
"loss": 0.0521, |
|
"step": 282 |
|
}, |
|
{ |
|
"epoch": 5.878048780487805, |
|
"eval_dim_128_cosine_accuracy@1": 0.34667410403012133, |
|
"eval_dim_128_cosine_accuracy@10": 0.7259796402175429, |
|
"eval_dim_128_cosine_accuracy@3": 0.46869334820806025, |
|
"eval_dim_128_cosine_accuracy@5": 0.548877422953563, |
|
"eval_dim_128_cosine_map@100": 0.44958294087462464, |
|
"eval_dim_128_cosine_mrr@10": 0.44026242161439555, |
|
"eval_dim_128_cosine_ndcg@10": 0.5064194393114915, |
|
"eval_dim_128_cosine_precision@1": 0.34667410403012133, |
|
"eval_dim_128_cosine_precision@10": 0.0725979640217543, |
|
"eval_dim_128_cosine_precision@3": 0.15623111606935342, |
|
"eval_dim_128_cosine_precision@5": 0.1097754845907126, |
|
"eval_dim_128_cosine_recall@1": 0.34667410403012133, |
|
"eval_dim_128_cosine_recall@10": 0.7259796402175429, |
|
"eval_dim_128_cosine_recall@3": 0.46869334820806025, |
|
"eval_dim_128_cosine_recall@5": 0.548877422953563, |
|
"eval_dim_256_cosine_accuracy@1": 0.35099707153813975, |
|
"eval_dim_256_cosine_accuracy@10": 0.719286013108353, |
|
"eval_dim_256_cosine_accuracy@3": 0.47455027192860133, |
|
"eval_dim_256_cosine_accuracy@5": 0.5502719286013108, |
|
"eval_dim_256_cosine_map@100": 0.45309491401564994, |
|
"eval_dim_256_cosine_mrr@10": 0.4432182202123648, |
|
"eval_dim_256_cosine_ndcg@10": 0.5072173461870104, |
|
"eval_dim_256_cosine_precision@1": 0.35099707153813975, |
|
"eval_dim_256_cosine_precision@10": 0.0719286013108353, |
|
"eval_dim_256_cosine_precision@3": 0.15818342397620047, |
|
"eval_dim_256_cosine_precision@5": 0.11005438572026217, |
|
"eval_dim_256_cosine_recall@1": 0.35099707153813975, |
|
"eval_dim_256_cosine_recall@10": 0.719286013108353, |
|
"eval_dim_256_cosine_recall@3": 0.47455027192860133, |
|
"eval_dim_256_cosine_recall@5": 0.5502719286013108, |
|
"eval_dim_512_cosine_accuracy@1": 0.3569934458234556, |
|
"eval_dim_512_cosine_accuracy@10": 0.7248640356993445, |
|
"eval_dim_512_cosine_accuracy@3": 0.4744108213638265, |
|
"eval_dim_512_cosine_accuracy@5": 0.5523636870729326, |
|
"eval_dim_512_cosine_map@100": 0.45691118758008836, |
|
"eval_dim_512_cosine_mrr@10": 0.4473125330641728, |
|
"eval_dim_512_cosine_ndcg@10": 0.5115413503217677, |
|
"eval_dim_512_cosine_precision@1": 0.3569934458234556, |
|
"eval_dim_512_cosine_precision@10": 0.07248640356993445, |
|
"eval_dim_512_cosine_precision@3": 0.15813694045460885, |
|
"eval_dim_512_cosine_precision@5": 0.11047273741458653, |
|
"eval_dim_512_cosine_recall@1": 0.3569934458234556, |
|
"eval_dim_512_cosine_recall@10": 0.7248640356993445, |
|
"eval_dim_512_cosine_recall@3": 0.4744108213638265, |
|
"eval_dim_512_cosine_recall@5": 0.5523636870729326, |
|
"eval_dim_64_cosine_accuracy@1": 0.3380281690140845, |
|
"eval_dim_64_cosine_accuracy@10": 0.7046437038070004, |
|
"eval_dim_64_cosine_accuracy@3": 0.4548877422953563, |
|
"eval_dim_64_cosine_accuracy@5": 0.5322828057453632, |
|
"eval_dim_64_cosine_map@100": 0.4382982729365051, |
|
"eval_dim_64_cosine_mrr@10": 0.4281275109402298, |
|
"eval_dim_64_cosine_ndcg@10": 0.49214355622918665, |
|
"eval_dim_64_cosine_precision@1": 0.3380281690140845, |
|
"eval_dim_64_cosine_precision@10": 0.07046437038070004, |
|
"eval_dim_64_cosine_precision@3": 0.1516292474317854, |
|
"eval_dim_64_cosine_precision@5": 0.10645656114907265, |
|
"eval_dim_64_cosine_recall@1": 0.3380281690140845, |
|
"eval_dim_64_cosine_recall@10": 0.7046437038070004, |
|
"eval_dim_64_cosine_recall@3": 0.4548877422953563, |
|
"eval_dim_64_cosine_recall@5": 0.5322828057453632, |
|
"eval_dim_768_cosine_accuracy@1": 0.35490168735183375, |
|
"eval_dim_768_cosine_accuracy@10": 0.7261190907823176, |
|
"eval_dim_768_cosine_accuracy@3": 0.4723190628922047, |
|
"eval_dim_768_cosine_accuracy@5": 0.5504113791660856, |
|
"eval_dim_768_cosine_map@100": 0.455135537492312, |
|
"eval_dim_768_cosine_mrr@10": 0.44549231583118165, |
|
"eval_dim_768_cosine_ndcg@10": 0.5104063813142831, |
|
"eval_dim_768_cosine_precision@1": 0.35490168735183375, |
|
"eval_dim_768_cosine_precision@10": 0.07261190907823176, |
|
"eval_dim_768_cosine_precision@3": 0.1574396876307349, |
|
"eval_dim_768_cosine_precision@5": 0.11008227583321714, |
|
"eval_dim_768_cosine_recall@1": 0.35490168735183375, |
|
"eval_dim_768_cosine_recall@10": 0.7261190907823176, |
|
"eval_dim_768_cosine_recall@3": 0.4723190628922047, |
|
"eval_dim_768_cosine_recall@5": 0.5504113791660856, |
|
"eval_loss": 0.16643136739730835, |
|
"eval_runtime": 5293.6409, |
|
"eval_samples_per_second": 1.355, |
|
"eval_sequential_score": 0.49214355622918665, |
|
"eval_steps_per_second": 0.014, |
|
"step": 282 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 282, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 6, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"EarlyStoppingCallback": { |
|
"args": { |
|
"early_stopping_patience": 1, |
|
"early_stopping_threshold": 0.001 |
|
}, |
|
"attributes": { |
|
"early_stopping_patience_counter": 1 |
|
} |
|
}, |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 0.0, |
|
"train_batch_size": 100, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|