| { |
| "best_global_step": 72, |
| "best_metric": 0.7275517192718437, |
| "best_model_checkpoint": "MNLP_M3_document_encoder_sciqa/checkpoint-72", |
| "epoch": 3.8135593220338984, |
| "eval_steps": 500, |
| "global_step": 72, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.5423728813559322, |
| "grad_norm": 164.72093200683594, |
| "learning_rate": 1.9987954562051724e-05, |
| "loss": 22.4049, |
| "step": 10 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_dim_128_cosine_accuracy@1": 0.5452812202097236, |
| "eval_dim_128_cosine_accuracy@10": 0.8760724499523356, |
| "eval_dim_128_cosine_accuracy@3": 0.7416587225929456, |
| "eval_dim_128_cosine_accuracy@5": 0.8074356530028599, |
| "eval_dim_128_cosine_map@100": 0.6605612754102786, |
| "eval_dim_128_cosine_mrr@10": 0.6559349796480402, |
| "eval_dim_128_cosine_ndcg@10": 0.7092688022688834, |
| "eval_dim_128_cosine_precision@1": 0.5452812202097236, |
| "eval_dim_128_cosine_precision@10": 0.08760724499523356, |
| "eval_dim_128_cosine_precision@3": 0.24721957419764853, |
| "eval_dim_128_cosine_precision@5": 0.161487130600572, |
| "eval_dim_128_cosine_recall@1": 0.5452812202097236, |
| "eval_dim_128_cosine_recall@10": 0.8760724499523356, |
| "eval_dim_128_cosine_recall@3": 0.7416587225929456, |
| "eval_dim_128_cosine_recall@5": 0.8074356530028599, |
| "eval_dim_192_cosine_accuracy@1": 0.5624404194470924, |
| "eval_dim_192_cosine_accuracy@10": 0.8932316491897044, |
| "eval_dim_192_cosine_accuracy@3": 0.7597712106768351, |
| "eval_dim_192_cosine_accuracy@5": 0.8188751191611058, |
| "eval_dim_192_cosine_map@100": 0.677245219852975, |
| "eval_dim_192_cosine_mrr@10": 0.6730234388003697, |
| "eval_dim_192_cosine_ndcg@10": 0.7262712999939527, |
| "eval_dim_192_cosine_precision@1": 0.5624404194470924, |
| "eval_dim_192_cosine_precision@10": 0.08932316491897044, |
| "eval_dim_192_cosine_precision@3": 0.25325707022561167, |
| "eval_dim_192_cosine_precision@5": 0.16377502383222117, |
| "eval_dim_192_cosine_recall@1": 0.5624404194470924, |
| "eval_dim_192_cosine_recall@10": 0.8932316491897044, |
| "eval_dim_192_cosine_recall@3": 0.7597712106768351, |
| "eval_dim_192_cosine_recall@5": 0.8188751191611058, |
| "eval_dim_256_cosine_accuracy@1": 0.5653002859866539, |
| "eval_dim_256_cosine_accuracy@10": 0.8960915157292659, |
| "eval_dim_256_cosine_accuracy@3": 0.7683508102955195, |
| "eval_dim_256_cosine_accuracy@5": 0.8236415633937083, |
| "eval_dim_256_cosine_map@100": 0.6831583296339104, |
| "eval_dim_256_cosine_mrr@10": 0.6786784844220503, |
| "eval_dim_256_cosine_ndcg@10": 0.7314611486548883, |
| "eval_dim_256_cosine_precision@1": 0.5653002859866539, |
| "eval_dim_256_cosine_precision@10": 0.08960915157292659, |
| "eval_dim_256_cosine_precision@3": 0.25611693676517316, |
| "eval_dim_256_cosine_precision@5": 0.16472831267874166, |
| "eval_dim_256_cosine_recall@1": 0.5653002859866539, |
| "eval_dim_256_cosine_recall@10": 0.8960915157292659, |
| "eval_dim_256_cosine_recall@3": 0.7683508102955195, |
| "eval_dim_256_cosine_recall@5": 0.8236415633937083, |
| "eval_dim_384_cosine_accuracy@1": 0.5786463298379408, |
| "eval_dim_384_cosine_accuracy@10": 0.9075309818875119, |
| "eval_dim_384_cosine_accuracy@3": 0.776930409914204, |
| "eval_dim_384_cosine_accuracy@5": 0.8417540514775977, |
| "eval_dim_384_cosine_map@100": 0.6932934943306605, |
| "eval_dim_384_cosine_mrr@10": 0.6894563227261042, |
| "eval_dim_384_cosine_ndcg@10": 0.7423737824827953, |
| "eval_dim_384_cosine_precision@1": 0.5786463298379408, |
| "eval_dim_384_cosine_precision@10": 0.0907530981887512, |
| "eval_dim_384_cosine_precision@3": 0.2589768033047346, |
| "eval_dim_384_cosine_precision@5": 0.16835081029551957, |
| "eval_dim_384_cosine_recall@1": 0.5786463298379408, |
| "eval_dim_384_cosine_recall@10": 0.9075309818875119, |
| "eval_dim_384_cosine_recall@3": 0.776930409914204, |
| "eval_dim_384_cosine_recall@5": 0.8417540514775977, |
| "eval_dim_64_cosine_accuracy@1": 0.49285033365109626, |
| "eval_dim_64_cosine_accuracy@10": 0.8274547187797903, |
| "eval_dim_64_cosine_accuracy@3": 0.684461391801716, |
| "eval_dim_64_cosine_accuracy@5": 0.7578646329837941, |
| "eval_dim_64_cosine_map@100": 0.6088952628032813, |
| "eval_dim_64_cosine_mrr@10": 0.6032237807738285, |
| "eval_dim_64_cosine_ndcg@10": 0.6575406372744073, |
| "eval_dim_64_cosine_precision@1": 0.49285033365109626, |
| "eval_dim_64_cosine_precision@10": 0.08274547187797902, |
| "eval_dim_64_cosine_precision@3": 0.2281537972672386, |
| "eval_dim_64_cosine_precision@5": 0.1515729265967588, |
| "eval_dim_64_cosine_recall@1": 0.49285033365109626, |
| "eval_dim_64_cosine_recall@10": 0.8274547187797903, |
| "eval_dim_64_cosine_recall@3": 0.684461391801716, |
| "eval_dim_64_cosine_recall@5": 0.7578646329837941, |
| "eval_dim_96_cosine_accuracy@1": 0.5214489990467112, |
| "eval_dim_96_cosine_accuracy@10": 0.8636796949475691, |
| "eval_dim_96_cosine_accuracy@3": 0.7264061010486177, |
| "eval_dim_96_cosine_accuracy@5": 0.7893231649189705, |
| "eval_dim_96_cosine_map@100": 0.6418431352074736, |
| "eval_dim_96_cosine_mrr@10": 0.6369528046363133, |
| "eval_dim_96_cosine_ndcg@10": 0.6919097155042885, |
| "eval_dim_96_cosine_precision@1": 0.5214489990467112, |
| "eval_dim_96_cosine_precision@10": 0.0863679694947569, |
| "eval_dim_96_cosine_precision@3": 0.2421353670162059, |
| "eval_dim_96_cosine_precision@5": 0.15786463298379408, |
| "eval_dim_96_cosine_recall@1": 0.5214489990467112, |
| "eval_dim_96_cosine_recall@10": 0.8636796949475691, |
| "eval_dim_96_cosine_recall@3": 0.7264061010486177, |
| "eval_dim_96_cosine_recall@5": 0.7893231649189705, |
| "eval_runtime": 116.4269, |
| "eval_samples_per_second": 0.0, |
| "eval_sequential_score": 0.6575406372744073, |
| "eval_steps_per_second": 0.0, |
| "step": 19 |
| }, |
| { |
| "epoch": 1.0542372881355933, |
| "grad_norm": 107.04779815673828, |
| "learning_rate": 1.8577286100002723e-05, |
| "loss": 16.6616, |
| "step": 20 |
| }, |
| { |
| "epoch": 1.5966101694915253, |
| "grad_norm": 97.63832092285156, |
| "learning_rate": 1.5141027441932217e-05, |
| "loss": 16.8367, |
| "step": 30 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_dim_128_cosine_accuracy@1": 0.567206863679695, |
| "eval_dim_128_cosine_accuracy@10": 0.886558627264061, |
| "eval_dim_128_cosine_accuracy@3": 0.7607244995233555, |
| "eval_dim_128_cosine_accuracy@5": 0.8236415633937083, |
| "eval_dim_128_cosine_map@100": 0.6790430112153837, |
| "eval_dim_128_cosine_mrr@10": 0.6746886679679823, |
| "eval_dim_128_cosine_ndcg@10": 0.7260517487265687, |
| "eval_dim_128_cosine_precision@1": 0.567206863679695, |
| "eval_dim_128_cosine_precision@10": 0.0886558627264061, |
| "eval_dim_128_cosine_precision@3": 0.25357483317445184, |
| "eval_dim_128_cosine_precision@5": 0.16472831267874166, |
| "eval_dim_128_cosine_recall@1": 0.567206863679695, |
| "eval_dim_128_cosine_recall@10": 0.886558627264061, |
| "eval_dim_128_cosine_recall@3": 0.7607244995233555, |
| "eval_dim_128_cosine_recall@5": 0.8236415633937083, |
| "eval_dim_192_cosine_accuracy@1": 0.5805529075309819, |
| "eval_dim_192_cosine_accuracy@10": 0.9008579599618685, |
| "eval_dim_192_cosine_accuracy@3": 0.782650142993327, |
| "eval_dim_192_cosine_accuracy@5": 0.8322211630123928, |
| "eval_dim_192_cosine_map@100": 0.6964841260809953, |
| "eval_dim_192_cosine_mrr@10": 0.6923562879234952, |
| "eval_dim_192_cosine_ndcg@10": 0.7430712975035773, |
| "eval_dim_192_cosine_precision@1": 0.5805529075309819, |
| "eval_dim_192_cosine_precision@10": 0.09008579599618685, |
| "eval_dim_192_cosine_precision@3": 0.26088338099777564, |
| "eval_dim_192_cosine_precision@5": 0.16644423260247856, |
| "eval_dim_192_cosine_recall@1": 0.5805529075309819, |
| "eval_dim_192_cosine_recall@10": 0.9008579599618685, |
| "eval_dim_192_cosine_recall@3": 0.782650142993327, |
| "eval_dim_192_cosine_recall@5": 0.8322211630123928, |
| "eval_dim_256_cosine_accuracy@1": 0.5919923736892279, |
| "eval_dim_256_cosine_accuracy@10": 0.9142040038131554, |
| "eval_dim_256_cosine_accuracy@3": 0.7902764537654909, |
| "eval_dim_256_cosine_accuracy@5": 0.8360343183984748, |
| "eval_dim_256_cosine_map@100": 0.7038093293311698, |
| "eval_dim_256_cosine_mrr@10": 0.700305279404422, |
| "eval_dim_256_cosine_ndcg@10": 0.7520267351833514, |
| "eval_dim_256_cosine_precision@1": 0.5919923736892279, |
| "eval_dim_256_cosine_precision@10": 0.09142040038131555, |
| "eval_dim_256_cosine_precision@3": 0.26342548458849696, |
| "eval_dim_256_cosine_precision@5": 0.16720686367969492, |
| "eval_dim_256_cosine_recall@1": 0.5919923736892279, |
| "eval_dim_256_cosine_recall@10": 0.9142040038131554, |
| "eval_dim_256_cosine_recall@3": 0.7902764537654909, |
| "eval_dim_256_cosine_recall@5": 0.8360343183984748, |
| "eval_dim_384_cosine_accuracy@1": 0.6015252621544328, |
| "eval_dim_384_cosine_accuracy@10": 0.9199237368922784, |
| "eval_dim_384_cosine_accuracy@3": 0.7959961868446139, |
| "eval_dim_384_cosine_accuracy@5": 0.8531935176358436, |
| "eval_dim_384_cosine_map@100": 0.713601684515785, |
| "eval_dim_384_cosine_mrr@10": 0.7104082497314151, |
| "eval_dim_384_cosine_ndcg@10": 0.761241503632434, |
| "eval_dim_384_cosine_precision@1": 0.6015252621544328, |
| "eval_dim_384_cosine_precision@10": 0.09199237368922783, |
| "eval_dim_384_cosine_precision@3": 0.26533206228153794, |
| "eval_dim_384_cosine_precision@5": 0.17063870352716873, |
| "eval_dim_384_cosine_recall@1": 0.6015252621544328, |
| "eval_dim_384_cosine_recall@10": 0.9199237368922784, |
| "eval_dim_384_cosine_recall@3": 0.7959961868446139, |
| "eval_dim_384_cosine_recall@5": 0.8531935176358436, |
| "eval_dim_64_cosine_accuracy@1": 0.5138226882745471, |
| "eval_dim_64_cosine_accuracy@10": 0.8341277407054337, |
| "eval_dim_64_cosine_accuracy@3": 0.7016205910390848, |
| "eval_dim_64_cosine_accuracy@5": 0.7645376549094376, |
| "eval_dim_64_cosine_map@100": 0.6242158272303533, |
| "eval_dim_64_cosine_mrr@10": 0.618670464690484, |
| "eval_dim_64_cosine_ndcg@10": 0.6707950308444217, |
| "eval_dim_64_cosine_precision@1": 0.5138226882745471, |
| "eval_dim_64_cosine_precision@10": 0.08341277407054337, |
| "eval_dim_64_cosine_precision@3": 0.2338735303463616, |
| "eval_dim_64_cosine_precision@5": 0.1529075309818875, |
| "eval_dim_64_cosine_recall@1": 0.5138226882745471, |
| "eval_dim_64_cosine_recall@10": 0.8341277407054337, |
| "eval_dim_64_cosine_recall@3": 0.7016205910390848, |
| "eval_dim_64_cosine_recall@5": 0.7645376549094376, |
| "eval_dim_96_cosine_accuracy@1": 0.5471877979027645, |
| "eval_dim_96_cosine_accuracy@10": 0.8722592945662536, |
| "eval_dim_96_cosine_accuracy@3": 0.7407054337464252, |
| "eval_dim_96_cosine_accuracy@5": 0.8017159199237369, |
| "eval_dim_96_cosine_map@100": 0.6622003643008398, |
| "eval_dim_96_cosine_mrr@10": 0.6576811627097615, |
| "eval_dim_96_cosine_ndcg@10": 0.7097194683573752, |
| "eval_dim_96_cosine_precision@1": 0.5471877979027645, |
| "eval_dim_96_cosine_precision@10": 0.08722592945662536, |
| "eval_dim_96_cosine_precision@3": 0.2469018112488084, |
| "eval_dim_96_cosine_precision@5": 0.16034318398474737, |
| "eval_dim_96_cosine_recall@1": 0.5471877979027645, |
| "eval_dim_96_cosine_recall@10": 0.8722592945662536, |
| "eval_dim_96_cosine_recall@3": 0.7407054337464252, |
| "eval_dim_96_cosine_recall@5": 0.8017159199237369, |
| "eval_runtime": 119.8934, |
| "eval_samples_per_second": 0.0, |
| "eval_sequential_score": 0.6707950308444217, |
| "eval_steps_per_second": 0.0, |
| "step": 38 |
| }, |
| { |
| "epoch": 2.1084745762711865, |
| "grad_norm": 113.89473724365234, |
| "learning_rate": 1.0490676743274181e-05, |
| "loss": 12.8169, |
| "step": 40 |
| }, |
| { |
| "epoch": 2.6508474576271186, |
| "grad_norm": 81.27326965332031, |
| "learning_rate": 5.724449065697182e-06, |
| "loss": 13.7826, |
| "step": 50 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_dim_128_cosine_accuracy@1": 0.567206863679695, |
| "eval_dim_128_cosine_accuracy@10": 0.8903717826501429, |
| "eval_dim_128_cosine_accuracy@3": 0.7616777883698761, |
| "eval_dim_128_cosine_accuracy@5": 0.8265014299332698, |
| "eval_dim_128_cosine_map@100": 0.6794753898354032, |
| "eval_dim_128_cosine_mrr@10": 0.6752920392815543, |
| "eval_dim_128_cosine_ndcg@10": 0.7273531110418706, |
| "eval_dim_128_cosine_precision@1": 0.567206863679695, |
| "eval_dim_128_cosine_precision@10": 0.08903717826501431, |
| "eval_dim_128_cosine_precision@3": 0.253892596123292, |
| "eval_dim_128_cosine_precision@5": 0.16530028598665394, |
| "eval_dim_128_cosine_recall@1": 0.567206863679695, |
| "eval_dim_128_cosine_recall@10": 0.8903717826501429, |
| "eval_dim_128_cosine_recall@3": 0.7616777883698761, |
| "eval_dim_128_cosine_recall@5": 0.8265014299332698, |
| "eval_dim_192_cosine_accuracy@1": 0.5910390848427073, |
| "eval_dim_192_cosine_accuracy@10": 0.9046711153479504, |
| "eval_dim_192_cosine_accuracy@3": 0.7778836987607245, |
| "eval_dim_192_cosine_accuracy@5": 0.8360343183984748, |
| "eval_dim_192_cosine_map@100": 0.7014228144337117, |
| "eval_dim_192_cosine_mrr@10": 0.6975449029309853, |
| "eval_dim_192_cosine_ndcg@10": 0.7477240665900656, |
| "eval_dim_192_cosine_precision@1": 0.5910390848427073, |
| "eval_dim_192_cosine_precision@10": 0.09046711153479504, |
| "eval_dim_192_cosine_precision@3": 0.25929456625357483, |
| "eval_dim_192_cosine_precision@5": 0.16720686367969495, |
| "eval_dim_192_cosine_recall@1": 0.5910390848427073, |
| "eval_dim_192_cosine_recall@10": 0.9046711153479504, |
| "eval_dim_192_cosine_recall@3": 0.7778836987607245, |
| "eval_dim_192_cosine_recall@5": 0.8360343183984748, |
| "eval_dim_256_cosine_accuracy@1": 0.5948522402287894, |
| "eval_dim_256_cosine_accuracy@10": 0.9151572926596759, |
| "eval_dim_256_cosine_accuracy@3": 0.792183031458532, |
| "eval_dim_256_cosine_accuracy@5": 0.8398474737845567, |
| "eval_dim_256_cosine_map@100": 0.7070932589939358, |
| "eval_dim_256_cosine_mrr@10": 0.7035797509343749, |
| "eval_dim_256_cosine_ndcg@10": 0.7548435122429773, |
| "eval_dim_256_cosine_precision@1": 0.5948522402287894, |
| "eval_dim_256_cosine_precision@10": 0.09151572926596759, |
| "eval_dim_256_cosine_precision@3": 0.2640610104861773, |
| "eval_dim_256_cosine_precision@5": 0.16796949475691134, |
| "eval_dim_256_cosine_recall@1": 0.5948522402287894, |
| "eval_dim_256_cosine_recall@10": 0.9151572926596759, |
| "eval_dim_256_cosine_recall@3": 0.792183031458532, |
| "eval_dim_256_cosine_recall@5": 0.8398474737845567, |
| "eval_dim_384_cosine_accuracy@1": 0.6101048617731173, |
| "eval_dim_384_cosine_accuracy@10": 0.9256434699714013, |
| "eval_dim_384_cosine_accuracy@3": 0.8007626310772163, |
| "eval_dim_384_cosine_accuracy@5": 0.8541468064823642, |
| "eval_dim_384_cosine_map@100": 0.7197084605820631, |
| "eval_dim_384_cosine_mrr@10": 0.7170116664396936, |
| "eval_dim_384_cosine_ndcg@10": 0.7675175612283535, |
| "eval_dim_384_cosine_precision@1": 0.6101048617731173, |
| "eval_dim_384_cosine_precision@10": 0.09256434699714014, |
| "eval_dim_384_cosine_precision@3": 0.2669208770257388, |
| "eval_dim_384_cosine_precision@5": 0.17082936129647283, |
| "eval_dim_384_cosine_recall@1": 0.6101048617731173, |
| "eval_dim_384_cosine_recall@10": 0.9256434699714013, |
| "eval_dim_384_cosine_recall@3": 0.8007626310772163, |
| "eval_dim_384_cosine_recall@5": 0.8541468064823642, |
| "eval_dim_64_cosine_accuracy@1": 0.5166825548141086, |
| "eval_dim_64_cosine_accuracy@10": 0.8369876072449952, |
| "eval_dim_64_cosine_accuracy@3": 0.7054337464251669, |
| "eval_dim_64_cosine_accuracy@5": 0.7673975214489991, |
| "eval_dim_64_cosine_map@100": 0.629350282837756, |
| "eval_dim_64_cosine_mrr@10": 0.6240088822309986, |
| "eval_dim_64_cosine_ndcg@10": 0.6755921916053389, |
| "eval_dim_64_cosine_precision@1": 0.5166825548141086, |
| "eval_dim_64_cosine_precision@10": 0.08369876072449953, |
| "eval_dim_64_cosine_precision@3": 0.23514458214172226, |
| "eval_dim_64_cosine_precision@5": 0.1534795042897998, |
| "eval_dim_64_cosine_recall@1": 0.5166825548141086, |
| "eval_dim_64_cosine_recall@10": 0.8369876072449952, |
| "eval_dim_64_cosine_recall@3": 0.7054337464251669, |
| "eval_dim_64_cosine_recall@5": 0.7673975214489991, |
| "eval_dim_96_cosine_accuracy@1": 0.5529075309818875, |
| "eval_dim_96_cosine_accuracy@10": 0.8741658722592945, |
| "eval_dim_96_cosine_accuracy@3": 0.7416587225929456, |
| "eval_dim_96_cosine_accuracy@5": 0.8093422306959008, |
| "eval_dim_96_cosine_map@100": 0.6652525185575742, |
| "eval_dim_96_cosine_mrr@10": 0.6608247461679306, |
| "eval_dim_96_cosine_ndcg@10": 0.7125237648315317, |
| "eval_dim_96_cosine_precision@1": 0.5529075309818875, |
| "eval_dim_96_cosine_precision@10": 0.08741658722592945, |
| "eval_dim_96_cosine_precision@3": 0.24721957419764853, |
| "eval_dim_96_cosine_precision@5": 0.1618684461391802, |
| "eval_dim_96_cosine_recall@1": 0.5529075309818875, |
| "eval_dim_96_cosine_recall@10": 0.8741658722592945, |
| "eval_dim_96_cosine_recall@3": 0.7416587225929456, |
| "eval_dim_96_cosine_recall@5": 0.8093422306959008, |
| "eval_runtime": 120.2085, |
| "eval_samples_per_second": 0.0, |
| "eval_sequential_score": 0.6755921916053389, |
| "eval_steps_per_second": 0.0, |
| "step": 57 |
| }, |
| { |
| "epoch": 3.1627118644067798, |
| "grad_norm": 102.55581665039062, |
| "learning_rate": 1.967924685193552e-06, |
| "loss": 12.4455, |
| "step": 60 |
| }, |
| { |
| "epoch": 3.705084745762712, |
| "grad_norm": 84.57442474365234, |
| "learning_rate": 1.0823490035218986e-07, |
| "loss": 12.2968, |
| "step": 70 |
| }, |
| { |
| "epoch": 3.8135593220338984, |
| "eval_dim_128_cosine_accuracy@1": 0.5662535748331744, |
| "eval_dim_128_cosine_accuracy@10": 0.8913250714966635, |
| "eval_dim_128_cosine_accuracy@3": 0.7626310772163966, |
| "eval_dim_128_cosine_accuracy@5": 0.8265014299332698, |
| "eval_dim_128_cosine_map@100": 0.6793502491099088, |
| "eval_dim_128_cosine_mrr@10": 0.6752375656331816, |
| "eval_dim_128_cosine_ndcg@10": 0.7275517192718437, |
| "eval_dim_128_cosine_precision@1": 0.5662535748331744, |
| "eval_dim_128_cosine_precision@10": 0.08913250714966635, |
| "eval_dim_128_cosine_precision@3": 0.25421035907213213, |
| "eval_dim_128_cosine_precision@5": 0.16530028598665394, |
| "eval_dim_128_cosine_recall@1": 0.5662535748331744, |
| "eval_dim_128_cosine_recall@10": 0.8913250714966635, |
| "eval_dim_128_cosine_recall@3": 0.7626310772163966, |
| "eval_dim_128_cosine_recall@5": 0.8265014299332698, |
| "eval_dim_192_cosine_accuracy@1": 0.5891325071496664, |
| "eval_dim_192_cosine_accuracy@10": 0.90371782650143, |
| "eval_dim_192_cosine_accuracy@3": 0.778836987607245, |
| "eval_dim_192_cosine_accuracy@5": 0.8331744518589133, |
| "eval_dim_192_cosine_map@100": 0.7004357679049269, |
| "eval_dim_192_cosine_mrr@10": 0.6964694266648511, |
| "eval_dim_192_cosine_ndcg@10": 0.7467179313530818, |
| "eval_dim_192_cosine_precision@1": 0.5891325071496664, |
| "eval_dim_192_cosine_precision@10": 0.090371782650143, |
| "eval_dim_192_cosine_precision@3": 0.259612329202415, |
| "eval_dim_192_cosine_precision@5": 0.16663489037178267, |
| "eval_dim_192_cosine_recall@1": 0.5891325071496664, |
| "eval_dim_192_cosine_recall@10": 0.90371782650143, |
| "eval_dim_192_cosine_recall@3": 0.778836987607245, |
| "eval_dim_192_cosine_recall@5": 0.8331744518589133, |
| "eval_dim_256_cosine_accuracy@1": 0.5977121067683508, |
| "eval_dim_256_cosine_accuracy@10": 0.9151572926596759, |
| "eval_dim_256_cosine_accuracy@3": 0.7912297426120114, |
| "eval_dim_256_cosine_accuracy@5": 0.8398474737845567, |
| "eval_dim_256_cosine_map@100": 0.7084736712852033, |
| "eval_dim_256_cosine_mrr@10": 0.7049529408204341, |
| "eval_dim_256_cosine_ndcg@10": 0.7558547240171754, |
| "eval_dim_256_cosine_precision@1": 0.5977121067683508, |
| "eval_dim_256_cosine_precision@10": 0.09151572926596759, |
| "eval_dim_256_cosine_precision@3": 0.26374324753733713, |
| "eval_dim_256_cosine_precision@5": 0.16796949475691134, |
| "eval_dim_256_cosine_recall@1": 0.5977121067683508, |
| "eval_dim_256_cosine_recall@10": 0.9151572926596759, |
| "eval_dim_256_cosine_recall@3": 0.7912297426120114, |
| "eval_dim_256_cosine_recall@5": 0.8398474737845567, |
| "eval_dim_384_cosine_accuracy@1": 0.6120114394661582, |
| "eval_dim_384_cosine_accuracy@10": 0.9275500476644424, |
| "eval_dim_384_cosine_accuracy@3": 0.8017159199237369, |
| "eval_dim_384_cosine_accuracy@5": 0.8541468064823642, |
| "eval_dim_384_cosine_map@100": 0.7210073638258574, |
| "eval_dim_384_cosine_mrr@10": 0.7184669450875366, |
| "eval_dim_384_cosine_ndcg@10": 0.7690377395004954, |
| "eval_dim_384_cosine_precision@1": 0.6120114394661582, |
| "eval_dim_384_cosine_precision@10": 0.09275500476644424, |
| "eval_dim_384_cosine_precision@3": 0.267238639974579, |
| "eval_dim_384_cosine_precision@5": 0.17082936129647283, |
| "eval_dim_384_cosine_recall@1": 0.6120114394661582, |
| "eval_dim_384_cosine_recall@10": 0.9275500476644424, |
| "eval_dim_384_cosine_recall@3": 0.8017159199237369, |
| "eval_dim_384_cosine_recall@5": 0.8541468064823642, |
| "eval_dim_64_cosine_accuracy@1": 0.5166825548141086, |
| "eval_dim_64_cosine_accuracy@10": 0.8369876072449952, |
| "eval_dim_64_cosine_accuracy@3": 0.7044804575786463, |
| "eval_dim_64_cosine_accuracy@5": 0.7683508102955195, |
| "eval_dim_64_cosine_map@100": 0.6292715088820261, |
| "eval_dim_64_cosine_mrr@10": 0.6239059875618503, |
| "eval_dim_64_cosine_ndcg@10": 0.6755211859192654, |
| "eval_dim_64_cosine_precision@1": 0.5166825548141086, |
| "eval_dim_64_cosine_precision@10": 0.08369876072449953, |
| "eval_dim_64_cosine_precision@3": 0.2348268191928821, |
| "eval_dim_64_cosine_precision@5": 0.1536701620591039, |
| "eval_dim_64_cosine_recall@1": 0.5166825548141086, |
| "eval_dim_64_cosine_recall@10": 0.8369876072449952, |
| "eval_dim_64_cosine_recall@3": 0.7044804575786463, |
| "eval_dim_64_cosine_recall@5": 0.7683508102955195, |
| "eval_dim_96_cosine_accuracy@1": 0.551954242135367, |
| "eval_dim_96_cosine_accuracy@10": 0.8732125834127741, |
| "eval_dim_96_cosine_accuracy@3": 0.7416587225929456, |
| "eval_dim_96_cosine_accuracy@5": 0.8093422306959008, |
| "eval_dim_96_cosine_map@100": 0.6648689218069684, |
| "eval_dim_96_cosine_mrr@10": 0.660333348464903, |
| "eval_dim_96_cosine_ndcg@10": 0.7119774118711802, |
| "eval_dim_96_cosine_precision@1": 0.551954242135367, |
| "eval_dim_96_cosine_precision@10": 0.08732125834127741, |
| "eval_dim_96_cosine_precision@3": 0.24721957419764853, |
| "eval_dim_96_cosine_precision@5": 0.1618684461391802, |
| "eval_dim_96_cosine_recall@1": 0.551954242135367, |
| "eval_dim_96_cosine_recall@10": 0.8732125834127741, |
| "eval_dim_96_cosine_recall@3": 0.7416587225929456, |
| "eval_dim_96_cosine_recall@5": 0.8093422306959008, |
| "eval_runtime": 122.4656, |
| "eval_samples_per_second": 0.0, |
| "eval_sequential_score": 0.6755211859192654, |
| "eval_steps_per_second": 0.0, |
| "step": 72 |
| } |
| ], |
| "logging_steps": 10, |
| "max_steps": 72, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 4, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 0.0, |
| "train_batch_size": 32, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|