{ "best_global_step": 72, "best_metric": 0.7275517192718437, "best_model_checkpoint": "MNLP_M3_document_encoder_sciqa/checkpoint-72", "epoch": 3.8135593220338984, "eval_steps": 500, "global_step": 72, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.5423728813559322, "grad_norm": 164.72093200683594, "learning_rate": 1.9987954562051724e-05, "loss": 22.4049, "step": 10 }, { "epoch": 1.0, "eval_dim_128_cosine_accuracy@1": 0.5452812202097236, "eval_dim_128_cosine_accuracy@10": 0.8760724499523356, "eval_dim_128_cosine_accuracy@3": 0.7416587225929456, "eval_dim_128_cosine_accuracy@5": 0.8074356530028599, "eval_dim_128_cosine_map@100": 0.6605612754102786, "eval_dim_128_cosine_mrr@10": 0.6559349796480402, "eval_dim_128_cosine_ndcg@10": 0.7092688022688834, "eval_dim_128_cosine_precision@1": 0.5452812202097236, "eval_dim_128_cosine_precision@10": 0.08760724499523356, "eval_dim_128_cosine_precision@3": 0.24721957419764853, "eval_dim_128_cosine_precision@5": 0.161487130600572, "eval_dim_128_cosine_recall@1": 0.5452812202097236, "eval_dim_128_cosine_recall@10": 0.8760724499523356, "eval_dim_128_cosine_recall@3": 0.7416587225929456, "eval_dim_128_cosine_recall@5": 0.8074356530028599, "eval_dim_192_cosine_accuracy@1": 0.5624404194470924, "eval_dim_192_cosine_accuracy@10": 0.8932316491897044, "eval_dim_192_cosine_accuracy@3": 0.7597712106768351, "eval_dim_192_cosine_accuracy@5": 0.8188751191611058, "eval_dim_192_cosine_map@100": 0.677245219852975, "eval_dim_192_cosine_mrr@10": 0.6730234388003697, "eval_dim_192_cosine_ndcg@10": 0.7262712999939527, "eval_dim_192_cosine_precision@1": 0.5624404194470924, "eval_dim_192_cosine_precision@10": 0.08932316491897044, "eval_dim_192_cosine_precision@3": 0.25325707022561167, "eval_dim_192_cosine_precision@5": 0.16377502383222117, "eval_dim_192_cosine_recall@1": 0.5624404194470924, "eval_dim_192_cosine_recall@10": 0.8932316491897044, "eval_dim_192_cosine_recall@3": 0.7597712106768351, "eval_dim_192_cosine_recall@5": 0.8188751191611058, "eval_dim_256_cosine_accuracy@1": 0.5653002859866539, "eval_dim_256_cosine_accuracy@10": 0.8960915157292659, "eval_dim_256_cosine_accuracy@3": 0.7683508102955195, "eval_dim_256_cosine_accuracy@5": 0.8236415633937083, "eval_dim_256_cosine_map@100": 0.6831583296339104, "eval_dim_256_cosine_mrr@10": 0.6786784844220503, "eval_dim_256_cosine_ndcg@10": 0.7314611486548883, "eval_dim_256_cosine_precision@1": 0.5653002859866539, "eval_dim_256_cosine_precision@10": 0.08960915157292659, "eval_dim_256_cosine_precision@3": 0.25611693676517316, "eval_dim_256_cosine_precision@5": 0.16472831267874166, "eval_dim_256_cosine_recall@1": 0.5653002859866539, "eval_dim_256_cosine_recall@10": 0.8960915157292659, "eval_dim_256_cosine_recall@3": 0.7683508102955195, "eval_dim_256_cosine_recall@5": 0.8236415633937083, "eval_dim_384_cosine_accuracy@1": 0.5786463298379408, "eval_dim_384_cosine_accuracy@10": 0.9075309818875119, "eval_dim_384_cosine_accuracy@3": 0.776930409914204, "eval_dim_384_cosine_accuracy@5": 0.8417540514775977, "eval_dim_384_cosine_map@100": 0.6932934943306605, "eval_dim_384_cosine_mrr@10": 0.6894563227261042, "eval_dim_384_cosine_ndcg@10": 0.7423737824827953, "eval_dim_384_cosine_precision@1": 0.5786463298379408, "eval_dim_384_cosine_precision@10": 0.0907530981887512, "eval_dim_384_cosine_precision@3": 0.2589768033047346, "eval_dim_384_cosine_precision@5": 0.16835081029551957, "eval_dim_384_cosine_recall@1": 0.5786463298379408, "eval_dim_384_cosine_recall@10": 0.9075309818875119, "eval_dim_384_cosine_recall@3": 0.776930409914204, "eval_dim_384_cosine_recall@5": 0.8417540514775977, "eval_dim_64_cosine_accuracy@1": 0.49285033365109626, "eval_dim_64_cosine_accuracy@10": 0.8274547187797903, "eval_dim_64_cosine_accuracy@3": 0.684461391801716, "eval_dim_64_cosine_accuracy@5": 0.7578646329837941, "eval_dim_64_cosine_map@100": 0.6088952628032813, "eval_dim_64_cosine_mrr@10": 0.6032237807738285, "eval_dim_64_cosine_ndcg@10": 0.6575406372744073, "eval_dim_64_cosine_precision@1": 0.49285033365109626, "eval_dim_64_cosine_precision@10": 0.08274547187797902, "eval_dim_64_cosine_precision@3": 0.2281537972672386, "eval_dim_64_cosine_precision@5": 0.1515729265967588, "eval_dim_64_cosine_recall@1": 0.49285033365109626, "eval_dim_64_cosine_recall@10": 0.8274547187797903, "eval_dim_64_cosine_recall@3": 0.684461391801716, "eval_dim_64_cosine_recall@5": 0.7578646329837941, "eval_dim_96_cosine_accuracy@1": 0.5214489990467112, "eval_dim_96_cosine_accuracy@10": 0.8636796949475691, "eval_dim_96_cosine_accuracy@3": 0.7264061010486177, "eval_dim_96_cosine_accuracy@5": 0.7893231649189705, "eval_dim_96_cosine_map@100": 0.6418431352074736, "eval_dim_96_cosine_mrr@10": 0.6369528046363133, "eval_dim_96_cosine_ndcg@10": 0.6919097155042885, "eval_dim_96_cosine_precision@1": 0.5214489990467112, "eval_dim_96_cosine_precision@10": 0.0863679694947569, "eval_dim_96_cosine_precision@3": 0.2421353670162059, "eval_dim_96_cosine_precision@5": 0.15786463298379408, "eval_dim_96_cosine_recall@1": 0.5214489990467112, "eval_dim_96_cosine_recall@10": 0.8636796949475691, "eval_dim_96_cosine_recall@3": 0.7264061010486177, "eval_dim_96_cosine_recall@5": 0.7893231649189705, "eval_runtime": 116.4269, "eval_samples_per_second": 0.0, "eval_sequential_score": 0.6575406372744073, "eval_steps_per_second": 0.0, "step": 19 }, { "epoch": 1.0542372881355933, "grad_norm": 107.04779815673828, "learning_rate": 1.8577286100002723e-05, "loss": 16.6616, "step": 20 }, { "epoch": 1.5966101694915253, "grad_norm": 97.63832092285156, "learning_rate": 1.5141027441932217e-05, "loss": 16.8367, "step": 30 }, { "epoch": 2.0, "eval_dim_128_cosine_accuracy@1": 0.567206863679695, "eval_dim_128_cosine_accuracy@10": 0.886558627264061, "eval_dim_128_cosine_accuracy@3": 0.7607244995233555, "eval_dim_128_cosine_accuracy@5": 0.8236415633937083, "eval_dim_128_cosine_map@100": 0.6790430112153837, "eval_dim_128_cosine_mrr@10": 0.6746886679679823, "eval_dim_128_cosine_ndcg@10": 0.7260517487265687, "eval_dim_128_cosine_precision@1": 0.567206863679695, "eval_dim_128_cosine_precision@10": 0.0886558627264061, "eval_dim_128_cosine_precision@3": 0.25357483317445184, "eval_dim_128_cosine_precision@5": 0.16472831267874166, "eval_dim_128_cosine_recall@1": 0.567206863679695, "eval_dim_128_cosine_recall@10": 0.886558627264061, "eval_dim_128_cosine_recall@3": 0.7607244995233555, "eval_dim_128_cosine_recall@5": 0.8236415633937083, "eval_dim_192_cosine_accuracy@1": 0.5805529075309819, "eval_dim_192_cosine_accuracy@10": 0.9008579599618685, "eval_dim_192_cosine_accuracy@3": 0.782650142993327, "eval_dim_192_cosine_accuracy@5": 0.8322211630123928, "eval_dim_192_cosine_map@100": 0.6964841260809953, "eval_dim_192_cosine_mrr@10": 0.6923562879234952, "eval_dim_192_cosine_ndcg@10": 0.7430712975035773, "eval_dim_192_cosine_precision@1": 0.5805529075309819, "eval_dim_192_cosine_precision@10": 0.09008579599618685, "eval_dim_192_cosine_precision@3": 0.26088338099777564, "eval_dim_192_cosine_precision@5": 0.16644423260247856, "eval_dim_192_cosine_recall@1": 0.5805529075309819, "eval_dim_192_cosine_recall@10": 0.9008579599618685, "eval_dim_192_cosine_recall@3": 0.782650142993327, "eval_dim_192_cosine_recall@5": 0.8322211630123928, "eval_dim_256_cosine_accuracy@1": 0.5919923736892279, "eval_dim_256_cosine_accuracy@10": 0.9142040038131554, "eval_dim_256_cosine_accuracy@3": 0.7902764537654909, "eval_dim_256_cosine_accuracy@5": 0.8360343183984748, "eval_dim_256_cosine_map@100": 0.7038093293311698, "eval_dim_256_cosine_mrr@10": 0.700305279404422, "eval_dim_256_cosine_ndcg@10": 0.7520267351833514, "eval_dim_256_cosine_precision@1": 0.5919923736892279, "eval_dim_256_cosine_precision@10": 0.09142040038131555, "eval_dim_256_cosine_precision@3": 0.26342548458849696, "eval_dim_256_cosine_precision@5": 0.16720686367969492, "eval_dim_256_cosine_recall@1": 0.5919923736892279, "eval_dim_256_cosine_recall@10": 0.9142040038131554, "eval_dim_256_cosine_recall@3": 0.7902764537654909, "eval_dim_256_cosine_recall@5": 0.8360343183984748, "eval_dim_384_cosine_accuracy@1": 0.6015252621544328, "eval_dim_384_cosine_accuracy@10": 0.9199237368922784, "eval_dim_384_cosine_accuracy@3": 0.7959961868446139, "eval_dim_384_cosine_accuracy@5": 0.8531935176358436, "eval_dim_384_cosine_map@100": 0.713601684515785, "eval_dim_384_cosine_mrr@10": 0.7104082497314151, "eval_dim_384_cosine_ndcg@10": 0.761241503632434, "eval_dim_384_cosine_precision@1": 0.6015252621544328, "eval_dim_384_cosine_precision@10": 0.09199237368922783, "eval_dim_384_cosine_precision@3": 0.26533206228153794, "eval_dim_384_cosine_precision@5": 0.17063870352716873, "eval_dim_384_cosine_recall@1": 0.6015252621544328, "eval_dim_384_cosine_recall@10": 0.9199237368922784, "eval_dim_384_cosine_recall@3": 0.7959961868446139, "eval_dim_384_cosine_recall@5": 0.8531935176358436, "eval_dim_64_cosine_accuracy@1": 0.5138226882745471, "eval_dim_64_cosine_accuracy@10": 0.8341277407054337, "eval_dim_64_cosine_accuracy@3": 0.7016205910390848, "eval_dim_64_cosine_accuracy@5": 0.7645376549094376, "eval_dim_64_cosine_map@100": 0.6242158272303533, "eval_dim_64_cosine_mrr@10": 0.618670464690484, "eval_dim_64_cosine_ndcg@10": 0.6707950308444217, "eval_dim_64_cosine_precision@1": 0.5138226882745471, "eval_dim_64_cosine_precision@10": 0.08341277407054337, "eval_dim_64_cosine_precision@3": 0.2338735303463616, "eval_dim_64_cosine_precision@5": 0.1529075309818875, "eval_dim_64_cosine_recall@1": 0.5138226882745471, "eval_dim_64_cosine_recall@10": 0.8341277407054337, "eval_dim_64_cosine_recall@3": 0.7016205910390848, "eval_dim_64_cosine_recall@5": 0.7645376549094376, "eval_dim_96_cosine_accuracy@1": 0.5471877979027645, "eval_dim_96_cosine_accuracy@10": 0.8722592945662536, "eval_dim_96_cosine_accuracy@3": 0.7407054337464252, "eval_dim_96_cosine_accuracy@5": 0.8017159199237369, "eval_dim_96_cosine_map@100": 0.6622003643008398, "eval_dim_96_cosine_mrr@10": 0.6576811627097615, "eval_dim_96_cosine_ndcg@10": 0.7097194683573752, "eval_dim_96_cosine_precision@1": 0.5471877979027645, "eval_dim_96_cosine_precision@10": 0.08722592945662536, "eval_dim_96_cosine_precision@3": 0.2469018112488084, "eval_dim_96_cosine_precision@5": 0.16034318398474737, "eval_dim_96_cosine_recall@1": 0.5471877979027645, "eval_dim_96_cosine_recall@10": 0.8722592945662536, "eval_dim_96_cosine_recall@3": 0.7407054337464252, "eval_dim_96_cosine_recall@5": 0.8017159199237369, "eval_runtime": 119.8934, "eval_samples_per_second": 0.0, "eval_sequential_score": 0.6707950308444217, "eval_steps_per_second": 0.0, "step": 38 }, { "epoch": 2.1084745762711865, "grad_norm": 113.89473724365234, "learning_rate": 1.0490676743274181e-05, "loss": 12.8169, "step": 40 }, { "epoch": 2.6508474576271186, "grad_norm": 81.27326965332031, "learning_rate": 5.724449065697182e-06, "loss": 13.7826, "step": 50 }, { "epoch": 3.0, "eval_dim_128_cosine_accuracy@1": 0.567206863679695, "eval_dim_128_cosine_accuracy@10": 0.8903717826501429, "eval_dim_128_cosine_accuracy@3": 0.7616777883698761, "eval_dim_128_cosine_accuracy@5": 0.8265014299332698, "eval_dim_128_cosine_map@100": 0.6794753898354032, "eval_dim_128_cosine_mrr@10": 0.6752920392815543, "eval_dim_128_cosine_ndcg@10": 0.7273531110418706, "eval_dim_128_cosine_precision@1": 0.567206863679695, "eval_dim_128_cosine_precision@10": 0.08903717826501431, "eval_dim_128_cosine_precision@3": 0.253892596123292, "eval_dim_128_cosine_precision@5": 0.16530028598665394, "eval_dim_128_cosine_recall@1": 0.567206863679695, "eval_dim_128_cosine_recall@10": 0.8903717826501429, "eval_dim_128_cosine_recall@3": 0.7616777883698761, "eval_dim_128_cosine_recall@5": 0.8265014299332698, "eval_dim_192_cosine_accuracy@1": 0.5910390848427073, "eval_dim_192_cosine_accuracy@10": 0.9046711153479504, "eval_dim_192_cosine_accuracy@3": 0.7778836987607245, "eval_dim_192_cosine_accuracy@5": 0.8360343183984748, "eval_dim_192_cosine_map@100": 0.7014228144337117, "eval_dim_192_cosine_mrr@10": 0.6975449029309853, "eval_dim_192_cosine_ndcg@10": 0.7477240665900656, "eval_dim_192_cosine_precision@1": 0.5910390848427073, "eval_dim_192_cosine_precision@10": 0.09046711153479504, "eval_dim_192_cosine_precision@3": 0.25929456625357483, "eval_dim_192_cosine_precision@5": 0.16720686367969495, "eval_dim_192_cosine_recall@1": 0.5910390848427073, "eval_dim_192_cosine_recall@10": 0.9046711153479504, "eval_dim_192_cosine_recall@3": 0.7778836987607245, "eval_dim_192_cosine_recall@5": 0.8360343183984748, "eval_dim_256_cosine_accuracy@1": 0.5948522402287894, "eval_dim_256_cosine_accuracy@10": 0.9151572926596759, "eval_dim_256_cosine_accuracy@3": 0.792183031458532, "eval_dim_256_cosine_accuracy@5": 0.8398474737845567, "eval_dim_256_cosine_map@100": 0.7070932589939358, "eval_dim_256_cosine_mrr@10": 0.7035797509343749, "eval_dim_256_cosine_ndcg@10": 0.7548435122429773, "eval_dim_256_cosine_precision@1": 0.5948522402287894, "eval_dim_256_cosine_precision@10": 0.09151572926596759, "eval_dim_256_cosine_precision@3": 0.2640610104861773, "eval_dim_256_cosine_precision@5": 0.16796949475691134, "eval_dim_256_cosine_recall@1": 0.5948522402287894, "eval_dim_256_cosine_recall@10": 0.9151572926596759, "eval_dim_256_cosine_recall@3": 0.792183031458532, "eval_dim_256_cosine_recall@5": 0.8398474737845567, "eval_dim_384_cosine_accuracy@1": 0.6101048617731173, "eval_dim_384_cosine_accuracy@10": 0.9256434699714013, "eval_dim_384_cosine_accuracy@3": 0.8007626310772163, "eval_dim_384_cosine_accuracy@5": 0.8541468064823642, "eval_dim_384_cosine_map@100": 0.7197084605820631, "eval_dim_384_cosine_mrr@10": 0.7170116664396936, "eval_dim_384_cosine_ndcg@10": 0.7675175612283535, "eval_dim_384_cosine_precision@1": 0.6101048617731173, "eval_dim_384_cosine_precision@10": 0.09256434699714014, "eval_dim_384_cosine_precision@3": 0.2669208770257388, "eval_dim_384_cosine_precision@5": 0.17082936129647283, "eval_dim_384_cosine_recall@1": 0.6101048617731173, "eval_dim_384_cosine_recall@10": 0.9256434699714013, "eval_dim_384_cosine_recall@3": 0.8007626310772163, "eval_dim_384_cosine_recall@5": 0.8541468064823642, "eval_dim_64_cosine_accuracy@1": 0.5166825548141086, "eval_dim_64_cosine_accuracy@10": 0.8369876072449952, "eval_dim_64_cosine_accuracy@3": 0.7054337464251669, "eval_dim_64_cosine_accuracy@5": 0.7673975214489991, "eval_dim_64_cosine_map@100": 0.629350282837756, "eval_dim_64_cosine_mrr@10": 0.6240088822309986, "eval_dim_64_cosine_ndcg@10": 0.6755921916053389, "eval_dim_64_cosine_precision@1": 0.5166825548141086, "eval_dim_64_cosine_precision@10": 0.08369876072449953, "eval_dim_64_cosine_precision@3": 0.23514458214172226, "eval_dim_64_cosine_precision@5": 0.1534795042897998, "eval_dim_64_cosine_recall@1": 0.5166825548141086, "eval_dim_64_cosine_recall@10": 0.8369876072449952, "eval_dim_64_cosine_recall@3": 0.7054337464251669, "eval_dim_64_cosine_recall@5": 0.7673975214489991, "eval_dim_96_cosine_accuracy@1": 0.5529075309818875, "eval_dim_96_cosine_accuracy@10": 0.8741658722592945, "eval_dim_96_cosine_accuracy@3": 0.7416587225929456, "eval_dim_96_cosine_accuracy@5": 0.8093422306959008, "eval_dim_96_cosine_map@100": 0.6652525185575742, "eval_dim_96_cosine_mrr@10": 0.6608247461679306, "eval_dim_96_cosine_ndcg@10": 0.7125237648315317, "eval_dim_96_cosine_precision@1": 0.5529075309818875, "eval_dim_96_cosine_precision@10": 0.08741658722592945, "eval_dim_96_cosine_precision@3": 0.24721957419764853, "eval_dim_96_cosine_precision@5": 0.1618684461391802, "eval_dim_96_cosine_recall@1": 0.5529075309818875, "eval_dim_96_cosine_recall@10": 0.8741658722592945, "eval_dim_96_cosine_recall@3": 0.7416587225929456, "eval_dim_96_cosine_recall@5": 0.8093422306959008, "eval_runtime": 120.2085, "eval_samples_per_second": 0.0, "eval_sequential_score": 0.6755921916053389, "eval_steps_per_second": 0.0, "step": 57 }, { "epoch": 3.1627118644067798, "grad_norm": 102.55581665039062, "learning_rate": 1.967924685193552e-06, "loss": 12.4455, "step": 60 }, { "epoch": 3.705084745762712, "grad_norm": 84.57442474365234, "learning_rate": 1.0823490035218986e-07, "loss": 12.2968, "step": 70 }, { "epoch": 3.8135593220338984, "eval_dim_128_cosine_accuracy@1": 0.5662535748331744, "eval_dim_128_cosine_accuracy@10": 0.8913250714966635, "eval_dim_128_cosine_accuracy@3": 0.7626310772163966, "eval_dim_128_cosine_accuracy@5": 0.8265014299332698, "eval_dim_128_cosine_map@100": 0.6793502491099088, "eval_dim_128_cosine_mrr@10": 0.6752375656331816, "eval_dim_128_cosine_ndcg@10": 0.7275517192718437, "eval_dim_128_cosine_precision@1": 0.5662535748331744, "eval_dim_128_cosine_precision@10": 0.08913250714966635, "eval_dim_128_cosine_precision@3": 0.25421035907213213, "eval_dim_128_cosine_precision@5": 0.16530028598665394, "eval_dim_128_cosine_recall@1": 0.5662535748331744, "eval_dim_128_cosine_recall@10": 0.8913250714966635, "eval_dim_128_cosine_recall@3": 0.7626310772163966, "eval_dim_128_cosine_recall@5": 0.8265014299332698, "eval_dim_192_cosine_accuracy@1": 0.5891325071496664, "eval_dim_192_cosine_accuracy@10": 0.90371782650143, "eval_dim_192_cosine_accuracy@3": 0.778836987607245, "eval_dim_192_cosine_accuracy@5": 0.8331744518589133, "eval_dim_192_cosine_map@100": 0.7004357679049269, "eval_dim_192_cosine_mrr@10": 0.6964694266648511, "eval_dim_192_cosine_ndcg@10": 0.7467179313530818, "eval_dim_192_cosine_precision@1": 0.5891325071496664, "eval_dim_192_cosine_precision@10": 0.090371782650143, "eval_dim_192_cosine_precision@3": 0.259612329202415, "eval_dim_192_cosine_precision@5": 0.16663489037178267, "eval_dim_192_cosine_recall@1": 0.5891325071496664, "eval_dim_192_cosine_recall@10": 0.90371782650143, "eval_dim_192_cosine_recall@3": 0.778836987607245, "eval_dim_192_cosine_recall@5": 0.8331744518589133, "eval_dim_256_cosine_accuracy@1": 0.5977121067683508, "eval_dim_256_cosine_accuracy@10": 0.9151572926596759, "eval_dim_256_cosine_accuracy@3": 0.7912297426120114, "eval_dim_256_cosine_accuracy@5": 0.8398474737845567, "eval_dim_256_cosine_map@100": 0.7084736712852033, "eval_dim_256_cosine_mrr@10": 0.7049529408204341, "eval_dim_256_cosine_ndcg@10": 0.7558547240171754, "eval_dim_256_cosine_precision@1": 0.5977121067683508, "eval_dim_256_cosine_precision@10": 0.09151572926596759, "eval_dim_256_cosine_precision@3": 0.26374324753733713, "eval_dim_256_cosine_precision@5": 0.16796949475691134, "eval_dim_256_cosine_recall@1": 0.5977121067683508, "eval_dim_256_cosine_recall@10": 0.9151572926596759, "eval_dim_256_cosine_recall@3": 0.7912297426120114, "eval_dim_256_cosine_recall@5": 0.8398474737845567, "eval_dim_384_cosine_accuracy@1": 0.6120114394661582, "eval_dim_384_cosine_accuracy@10": 0.9275500476644424, "eval_dim_384_cosine_accuracy@3": 0.8017159199237369, "eval_dim_384_cosine_accuracy@5": 0.8541468064823642, "eval_dim_384_cosine_map@100": 0.7210073638258574, "eval_dim_384_cosine_mrr@10": 0.7184669450875366, "eval_dim_384_cosine_ndcg@10": 0.7690377395004954, "eval_dim_384_cosine_precision@1": 0.6120114394661582, "eval_dim_384_cosine_precision@10": 0.09275500476644424, "eval_dim_384_cosine_precision@3": 0.267238639974579, "eval_dim_384_cosine_precision@5": 0.17082936129647283, "eval_dim_384_cosine_recall@1": 0.6120114394661582, "eval_dim_384_cosine_recall@10": 0.9275500476644424, "eval_dim_384_cosine_recall@3": 0.8017159199237369, "eval_dim_384_cosine_recall@5": 0.8541468064823642, "eval_dim_64_cosine_accuracy@1": 0.5166825548141086, "eval_dim_64_cosine_accuracy@10": 0.8369876072449952, "eval_dim_64_cosine_accuracy@3": 0.7044804575786463, "eval_dim_64_cosine_accuracy@5": 0.7683508102955195, "eval_dim_64_cosine_map@100": 0.6292715088820261, "eval_dim_64_cosine_mrr@10": 0.6239059875618503, "eval_dim_64_cosine_ndcg@10": 0.6755211859192654, "eval_dim_64_cosine_precision@1": 0.5166825548141086, "eval_dim_64_cosine_precision@10": 0.08369876072449953, "eval_dim_64_cosine_precision@3": 0.2348268191928821, "eval_dim_64_cosine_precision@5": 0.1536701620591039, "eval_dim_64_cosine_recall@1": 0.5166825548141086, "eval_dim_64_cosine_recall@10": 0.8369876072449952, "eval_dim_64_cosine_recall@3": 0.7044804575786463, "eval_dim_64_cosine_recall@5": 0.7683508102955195, "eval_dim_96_cosine_accuracy@1": 0.551954242135367, "eval_dim_96_cosine_accuracy@10": 0.8732125834127741, "eval_dim_96_cosine_accuracy@3": 0.7416587225929456, "eval_dim_96_cosine_accuracy@5": 0.8093422306959008, "eval_dim_96_cosine_map@100": 0.6648689218069684, "eval_dim_96_cosine_mrr@10": 0.660333348464903, "eval_dim_96_cosine_ndcg@10": 0.7119774118711802, "eval_dim_96_cosine_precision@1": 0.551954242135367, "eval_dim_96_cosine_precision@10": 0.08732125834127741, "eval_dim_96_cosine_precision@3": 0.24721957419764853, "eval_dim_96_cosine_precision@5": 0.1618684461391802, "eval_dim_96_cosine_recall@1": 0.551954242135367, "eval_dim_96_cosine_recall@10": 0.8732125834127741, "eval_dim_96_cosine_recall@3": 0.7416587225929456, "eval_dim_96_cosine_recall@5": 0.8093422306959008, "eval_runtime": 122.4656, "eval_samples_per_second": 0.0, "eval_sequential_score": 0.6755211859192654, "eval_steps_per_second": 0.0, "step": 72 } ], "logging_steps": 10, "max_steps": 72, "num_input_tokens_seen": 0, "num_train_epochs": 4, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }