IoannisKat1's picture
Add finetuned model
42557c6 verified
{
"best_global_step": 39,
"best_metric": 0.37139192897263235,
"best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
"epoch": 4.0,
"eval_steps": 500,
"global_step": 52,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.8163265306122449,
"grad_norm": 307.08624267578125,
"learning_rate": 7.500000000000001e-06,
"loss": 31.5155,
"step": 10
},
{
"epoch": 1.0,
"eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
"eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
"eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
"eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
"eval_dim_1024_cosine_map@100": 0.508986346237021,
"eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
"eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
"eval_dim_1024_cosine_precision@1": 0.42509603072983354,
"eval_dim_1024_cosine_precision@10": 0.376056338028169,
"eval_dim_1024_cosine_precision@3": 0.42402902262057185,
"eval_dim_1024_cosine_precision@5": 0.4133162612035851,
"eval_dim_1024_cosine_recall@1": 0.04813624827530403,
"eval_dim_1024_cosine_recall@10": 0.3150476790176975,
"eval_dim_1024_cosine_recall@3": 0.1404092551990217,
"eval_dim_1024_cosine_recall@5": 0.21147403835662126,
"eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
"eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
"eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
"eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
"eval_dim_128_cosine_map@100": 0.3991669558616212,
"eval_dim_128_cosine_mrr@10": 0.32517427799117904,
"eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
"eval_dim_128_cosine_precision@1": 0.31370038412291934,
"eval_dim_128_cosine_precision@10": 0.2764404609475032,
"eval_dim_128_cosine_precision@3": 0.31284677763551,
"eval_dim_128_cosine_precision@5": 0.30422535211267604,
"eval_dim_128_cosine_recall@1": 0.037933385936292925,
"eval_dim_128_cosine_recall@10": 0.24798465115464788,
"eval_dim_128_cosine_recall@3": 0.11100168654049715,
"eval_dim_128_cosine_recall@5": 0.1670926413559068,
"eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
"eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
"eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
"eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
"eval_dim_256_cosine_map@100": 0.45841270037343096,
"eval_dim_256_cosine_mrr@10": 0.37879397597707415,
"eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
"eval_dim_256_cosine_precision@1": 0.36427656850192064,
"eval_dim_256_cosine_precision@10": 0.3289372599231754,
"eval_dim_256_cosine_precision@3": 0.36363636363636365,
"eval_dim_256_cosine_precision@5": 0.3560819462227913,
"eval_dim_256_cosine_recall@1": 0.04277277943657814,
"eval_dim_256_cosine_recall@10": 0.28617844199333936,
"eval_dim_256_cosine_recall@3": 0.1253991943934714,
"eval_dim_256_cosine_recall@5": 0.18947388504512186,
"eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
"eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
"eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
"eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
"eval_dim_512_cosine_map@100": 0.495554245202425,
"eval_dim_512_cosine_mrr@10": 0.42213127248338495,
"eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
"eval_dim_512_cosine_precision@1": 0.4084507042253521,
"eval_dim_512_cosine_precision@10": 0.36606914212548014,
"eval_dim_512_cosine_precision@3": 0.40738369611609043,
"eval_dim_512_cosine_precision@5": 0.39846350832266325,
"eval_dim_512_cosine_recall@1": 0.04628035514721453,
"eval_dim_512_cosine_recall@10": 0.30419701916496145,
"eval_dim_512_cosine_recall@3": 0.13522898183596205,
"eval_dim_512_cosine_recall@5": 0.20394662187726964,
"eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
"eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
"eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
"eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
"eval_dim_64_cosine_map@100": 0.31803601064541553,
"eval_dim_64_cosine_mrr@10": 0.25159771761884414,
"eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
"eval_dim_64_cosine_precision@1": 0.24199743918053776,
"eval_dim_64_cosine_precision@10": 0.21568501920614594,
"eval_dim_64_cosine_precision@3": 0.24199743918053776,
"eval_dim_64_cosine_precision@5": 0.23649167733674775,
"eval_dim_64_cosine_recall@1": 0.029110868794154622,
"eval_dim_64_cosine_recall@10": 0.19521971714475267,
"eval_dim_64_cosine_recall@3": 0.08524734139651896,
"eval_dim_64_cosine_recall@5": 0.12921904680249943,
"eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
"eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
"eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
"eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
"eval_dim_768_cosine_map@100": 0.5037778776293926,
"eval_dim_768_cosine_mrr@10": 0.4315339003719285,
"eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
"eval_dim_768_cosine_precision@1": 0.4193341869398207,
"eval_dim_768_cosine_precision@10": 0.37272727272727274,
"eval_dim_768_cosine_precision@3": 0.4180537772087068,
"eval_dim_768_cosine_precision@5": 0.4076824583866837,
"eval_dim_768_cosine_recall@1": 0.04699592881851732,
"eval_dim_768_cosine_recall@10": 0.3107289399017082,
"eval_dim_768_cosine_recall@3": 0.13721565163348118,
"eval_dim_768_cosine_recall@5": 0.20710427114944024,
"eval_runtime": 98.6525,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.2620553065689597,
"eval_steps_per_second": 0.0,
"step": 13
},
{
"epoch": 1.5714285714285714,
"grad_norm": 280.07818603515625,
"learning_rate": 1.5833333333333333e-05,
"loss": 19.0409,
"step": 20
},
{
"epoch": 2.0,
"eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
"eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
"eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
"eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
"eval_dim_1024_cosine_map@100": 0.47259820099791205,
"eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
"eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
"eval_dim_1024_cosine_precision@1": 0.3854033290653009,
"eval_dim_1024_cosine_precision@10": 0.3357874519846351,
"eval_dim_1024_cosine_precision@3": 0.3839095177123346,
"eval_dim_1024_cosine_precision@5": 0.3713188220230474,
"eval_dim_1024_cosine_recall@1": 0.0451686782205082,
"eval_dim_1024_cosine_recall@10": 0.2918225395020212,
"eval_dim_1024_cosine_recall@3": 0.13200270380544088,
"eval_dim_1024_cosine_recall@5": 0.19735476247586825,
"eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
"eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
"eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
"eval_dim_128_cosine_accuracy@5": 0.352112676056338,
"eval_dim_128_cosine_map@100": 0.40471008477532144,
"eval_dim_128_cosine_mrr@10": 0.32839105339105285,
"eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
"eval_dim_128_cosine_precision@1": 0.31562099871959026,
"eval_dim_128_cosine_precision@10": 0.280729833546735,
"eval_dim_128_cosine_precision@3": 0.31455399061032857,
"eval_dim_128_cosine_precision@5": 0.30640204865556975,
"eval_dim_128_cosine_recall@1": 0.03888088094516579,
"eval_dim_128_cosine_recall@10": 0.2550464126190524,
"eval_dim_128_cosine_recall@3": 0.11341113256173359,
"eval_dim_128_cosine_recall@5": 0.17046484922169536,
"eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
"eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
"eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
"eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
"eval_dim_256_cosine_map@100": 0.43770217754051305,
"eval_dim_256_cosine_mrr@10": 0.35596482938032165,
"eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
"eval_dim_256_cosine_precision@1": 0.3418693982074264,
"eval_dim_256_cosine_precision@10": 0.30441741357234314,
"eval_dim_256_cosine_precision@3": 0.34165599658557405,
"eval_dim_256_cosine_precision@5": 0.3322663252240717,
"eval_dim_256_cosine_recall@1": 0.041410929155814194,
"eval_dim_256_cosine_recall@10": 0.2705196189189818,
"eval_dim_256_cosine_recall@3": 0.1212642412965687,
"eval_dim_256_cosine_recall@5": 0.18173918651563936,
"eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
"eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
"eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
"eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
"eval_dim_512_cosine_map@100": 0.4678017780580059,
"eval_dim_512_cosine_mrr@10": 0.3893670101416575,
"eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
"eval_dim_512_cosine_precision@1": 0.37708066581306016,
"eval_dim_512_cosine_precision@10": 0.33156209987195906,
"eval_dim_512_cosine_precision@3": 0.37537345283824153,
"eval_dim_512_cosine_precision@5": 0.36402048655569774,
"eval_dim_512_cosine_recall@1": 0.04457309853297402,
"eval_dim_512_cosine_recall@10": 0.2883968018428671,
"eval_dim_512_cosine_recall@3": 0.13007205872054822,
"eval_dim_512_cosine_recall@5": 0.19449520589871025,
"eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
"eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
"eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
"eval_dim_64_cosine_accuracy@5": 0.293213828425096,
"eval_dim_64_cosine_map@100": 0.34719730722747555,
"eval_dim_64_cosine_mrr@10": 0.2776957197731842,
"eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
"eval_dim_64_cosine_precision@1": 0.26696542893725994,
"eval_dim_64_cosine_precision@10": 0.237708066581306,
"eval_dim_64_cosine_precision@3": 0.26717883055911223,
"eval_dim_64_cosine_precision@5": 0.2596670934699104,
"eval_dim_64_cosine_recall@1": 0.031692344067516816,
"eval_dim_64_cosine_recall@10": 0.21473974122936995,
"eval_dim_64_cosine_recall@3": 0.09327455064654774,
"eval_dim_64_cosine_recall@5": 0.14131510912407144,
"eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
"eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
"eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
"eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
"eval_dim_768_cosine_map@100": 0.4672061011440217,
"eval_dim_768_cosine_mrr@10": 0.38746671950897227,
"eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
"eval_dim_768_cosine_precision@1": 0.37451984635083224,
"eval_dim_768_cosine_precision@10": 0.3318181818181818,
"eval_dim_768_cosine_precision@3": 0.3734528382415706,
"eval_dim_768_cosine_precision@5": 0.3632522407170295,
"eval_dim_768_cosine_recall@1": 0.04413921317349132,
"eval_dim_768_cosine_recall@10": 0.28955317519546525,
"eval_dim_768_cosine_recall@3": 0.12896663310051748,
"eval_dim_768_cosine_recall@5": 0.19376203165061448,
"eval_runtime": 98.4244,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.2881905192612941,
"eval_steps_per_second": 0.0,
"step": 26
},
{
"epoch": 2.326530612244898,
"grad_norm": 305.66259765625,
"learning_rate": 1.9973569167005725e-05,
"loss": 14.5314,
"step": 30
},
{
"epoch": 3.0,
"eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
"eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
"eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
"eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
"eval_dim_1024_cosine_map@100": 0.506794523350519,
"eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
"eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
"eval_dim_1024_cosine_precision@1": 0.4180537772087068,
"eval_dim_1024_cosine_precision@10": 0.36869398207426374,
"eval_dim_1024_cosine_precision@3": 0.4163465642338881,
"eval_dim_1024_cosine_precision@5": 0.4043533930857874,
"eval_dim_1024_cosine_recall@1": 0.04734422767263886,
"eval_dim_1024_cosine_recall@10": 0.308531274625124,
"eval_dim_1024_cosine_recall@3": 0.138064233626932,
"eval_dim_1024_cosine_recall@5": 0.2069980430010945,
"eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
"eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
"eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
"eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
"eval_dim_128_cosine_map@100": 0.4338211299784659,
"eval_dim_128_cosine_mrr@10": 0.35916305916305874,
"eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
"eval_dim_128_cosine_precision@1": 0.34699103713188223,
"eval_dim_128_cosine_precision@10": 0.3042893725992318,
"eval_dim_128_cosine_precision@3": 0.34571062740076824,
"eval_dim_128_cosine_precision@5": 0.3352112676056338,
"eval_dim_128_cosine_recall@1": 0.04217848526747235,
"eval_dim_128_cosine_recall@10": 0.2706183968947745,
"eval_dim_128_cosine_recall@3": 0.12288848071178002,
"eval_dim_128_cosine_recall@5": 0.18344012521240954,
"eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
"eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
"eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
"eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
"eval_dim_256_cosine_map@100": 0.4709582085612654,
"eval_dim_256_cosine_mrr@10": 0.3957850639188662,
"eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
"eval_dim_256_cosine_precision@1": 0.38348271446862997,
"eval_dim_256_cosine_precision@10": 0.33886043533930854,
"eval_dim_256_cosine_precision@3": 0.382202304737516,
"eval_dim_256_cosine_precision@5": 0.3718309859154929,
"eval_dim_256_cosine_recall@1": 0.04466034705404223,
"eval_dim_256_cosine_recall@10": 0.2892016292717267,
"eval_dim_256_cosine_recall@3": 0.1301795023253766,
"eval_dim_256_cosine_recall@5": 0.19500340584044382,
"eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
"eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
"eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
"eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
"eval_dim_512_cosine_map@100": 0.49555759572196095,
"eval_dim_512_cosine_mrr@10": 0.41950236774180394,
"eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
"eval_dim_512_cosine_precision@1": 0.4065300896286812,
"eval_dim_512_cosine_precision@10": 0.3596030729833547,
"eval_dim_512_cosine_precision@3": 0.4054630815194195,
"eval_dim_512_cosine_precision@5": 0.3947503201024327,
"eval_dim_512_cosine_recall@1": 0.047372341735862133,
"eval_dim_512_cosine_recall@10": 0.3071623578952262,
"eval_dim_512_cosine_recall@3": 0.1383106496582531,
"eval_dim_512_cosine_recall@5": 0.20757258542171747,
"eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
"eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
"eval_dim_64_cosine_accuracy@3": 0.322663252240717,
"eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
"eval_dim_64_cosine_map@100": 0.3933467041096336,
"eval_dim_64_cosine_mrr@10": 0.32884732638253733,
"eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
"eval_dim_64_cosine_precision@1": 0.3207426376440461,
"eval_dim_64_cosine_precision@10": 0.2797055057618438,
"eval_dim_64_cosine_precision@3": 0.3188220230473751,
"eval_dim_64_cosine_precision@5": 0.3088348271446863,
"eval_dim_64_cosine_recall@1": 0.036318765090758674,
"eval_dim_64_cosine_recall@10": 0.23840960718091392,
"eval_dim_64_cosine_recall@3": 0.10562189493083342,
"eval_dim_64_cosine_recall@5": 0.15867125525021739,
"eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
"eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
"eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
"eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
"eval_dim_768_cosine_map@100": 0.500478306774528,
"eval_dim_768_cosine_mrr@10": 0.4224889742495374,
"eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
"eval_dim_768_cosine_precision@1": 0.41037131882202305,
"eval_dim_768_cosine_precision@10": 0.36165172855313704,
"eval_dim_768_cosine_precision@3": 0.4086641058472044,
"eval_dim_768_cosine_precision@5": 0.3969270166453265,
"eval_dim_768_cosine_recall@1": 0.047186779325657804,
"eval_dim_768_cosine_recall@10": 0.30540044861465576,
"eval_dim_768_cosine_recall@3": 0.1375709294981283,
"eval_dim_768_cosine_recall@5": 0.20603724780478358,
"eval_runtime": 98.5908,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.3371953828075091,
"eval_steps_per_second": 0.0,
"step": 39
},
{
"epoch": 3.0816326530612246,
"grad_norm": 255.65982055664062,
"learning_rate": 1.9762960071199334e-05,
"loss": 8.6778,
"step": 40
},
{
"epoch": 3.8979591836734695,
"grad_norm": 470.4803771972656,
"learning_rate": 1.9346189253489888e-05,
"loss": 6.0257,
"step": 50
},
{
"epoch": 4.0,
"eval_dim_1024_cosine_accuracy@1": 0.4046094750320102,
"eval_dim_1024_cosine_accuracy@10": 0.47823303457106275,
"eval_dim_1024_cosine_accuracy@3": 0.4090909090909091,
"eval_dim_1024_cosine_accuracy@5": 0.43918053777208704,
"eval_dim_1024_cosine_map@100": 0.490599623630225,
"eval_dim_1024_cosine_mrr@10": 0.4168417068064951,
"eval_dim_1024_cosine_ndcg@10": 0.42913551824501384,
"eval_dim_1024_cosine_precision@1": 0.4046094750320102,
"eval_dim_1024_cosine_precision@10": 0.3565941101152369,
"eval_dim_1024_cosine_precision@3": 0.40311566367904395,
"eval_dim_1024_cosine_precision@5": 0.39180537772087065,
"eval_dim_1024_cosine_recall@1": 0.04660606778759063,
"eval_dim_1024_cosine_recall@10": 0.3014663479400921,
"eval_dim_1024_cosine_recall@3": 0.13592596883673455,
"eval_dim_1024_cosine_recall@5": 0.20379253880710943,
"eval_dim_128_cosine_accuracy@1": 0.34314980793854033,
"eval_dim_128_cosine_accuracy@10": 0.4148527528809219,
"eval_dim_128_cosine_accuracy@3": 0.34763124199743917,
"eval_dim_128_cosine_accuracy@5": 0.37708066581306016,
"eval_dim_128_cosine_map@100": 0.4276696379169563,
"eval_dim_128_cosine_mrr@10": 0.35513180090644836,
"eval_dim_128_cosine_ndcg@10": 0.36765573601526275,
"eval_dim_128_cosine_precision@1": 0.34314980793854033,
"eval_dim_128_cosine_precision@10": 0.302752880921895,
"eval_dim_128_cosine_precision@3": 0.3418693982074264,
"eval_dim_128_cosine_precision@5": 0.3322663252240717,
"eval_dim_128_cosine_recall@1": 0.040652627677675406,
"eval_dim_128_cosine_recall@10": 0.26330336421247125,
"eval_dim_128_cosine_recall@3": 0.1184519992454523,
"eval_dim_128_cosine_recall@5": 0.1774839552040709,
"eval_dim_256_cosine_accuracy@1": 0.3738796414852753,
"eval_dim_256_cosine_accuracy@10": 0.44558258642765686,
"eval_dim_256_cosine_accuracy@3": 0.37772087067861715,
"eval_dim_256_cosine_accuracy@5": 0.40717029449423814,
"eval_dim_256_cosine_map@100": 0.45855798848430374,
"eval_dim_256_cosine_mrr@10": 0.38572571794402755,
"eval_dim_256_cosine_ndcg@10": 0.3980442434686935,
"eval_dim_256_cosine_precision@1": 0.3738796414852753,
"eval_dim_256_cosine_precision@10": 0.3297695262483995,
"eval_dim_256_cosine_precision@3": 0.37238583013230897,
"eval_dim_256_cosine_precision@5": 0.3615877080665813,
"eval_dim_256_cosine_recall@1": 0.043086085492826574,
"eval_dim_256_cosine_recall@10": 0.2792649180924836,
"eval_dim_256_cosine_recall@3": 0.125747799799009,
"eval_dim_256_cosine_recall@5": 0.18837022600852496,
"eval_dim_512_cosine_accuracy@1": 0.39884763124199746,
"eval_dim_512_cosine_accuracy@10": 0.47823303457106275,
"eval_dim_512_cosine_accuracy@3": 0.4052496798975672,
"eval_dim_512_cosine_accuracy@5": 0.44558258642765686,
"eval_dim_512_cosine_map@100": 0.4876319198894288,
"eval_dim_512_cosine_mrr@10": 0.41307745462675005,
"eval_dim_512_cosine_ndcg@10": 0.42824151108259556,
"eval_dim_512_cosine_precision@1": 0.39884763124199746,
"eval_dim_512_cosine_precision@10": 0.35793854033290645,
"eval_dim_512_cosine_precision@3": 0.3975672215108835,
"eval_dim_512_cosine_precision@5": 0.3888604353393086,
"eval_dim_512_cosine_recall@1": 0.04570727180608771,
"eval_dim_512_cosine_recall@10": 0.2993652309972795,
"eval_dim_512_cosine_recall@3": 0.13329368345632836,
"eval_dim_512_cosine_recall@5": 0.2006035854063678,
"eval_dim_64_cosine_accuracy@1": 0.3079385403329065,
"eval_dim_64_cosine_accuracy@10": 0.36555697823303457,
"eval_dim_64_cosine_accuracy@3": 0.31241997439180536,
"eval_dim_64_cosine_accuracy@5": 0.33290653008962867,
"eval_dim_64_cosine_map@100": 0.38184314430829974,
"eval_dim_64_cosine_mrr@10": 0.31748394406845065,
"eval_dim_64_cosine_ndcg@10": 0.3275369456141822,
"eval_dim_64_cosine_precision@1": 0.3079385403329065,
"eval_dim_64_cosine_precision@10": 0.27215108834827145,
"eval_dim_64_cosine_precision@3": 0.3070849338454972,
"eval_dim_64_cosine_precision@5": 0.29820742637644043,
"eval_dim_64_cosine_recall@1": 0.03504677697523653,
"eval_dim_64_cosine_recall@10": 0.23026653514933906,
"eval_dim_64_cosine_recall@3": 0.10211269541567973,
"eval_dim_64_cosine_recall@5": 0.15297976910096123,
"eval_dim_768_cosine_accuracy@1": 0.3994878361075544,
"eval_dim_768_cosine_accuracy@10": 0.4737516005121639,
"eval_dim_768_cosine_accuracy@3": 0.4046094750320102,
"eval_dim_768_cosine_accuracy@5": 0.4359795134443022,
"eval_dim_768_cosine_map@100": 0.48680507317454147,
"eval_dim_768_cosine_mrr@10": 0.41201019246793846,
"eval_dim_768_cosine_ndcg@10": 0.4244383191680289,
"eval_dim_768_cosine_precision@1": 0.3994878361075544,
"eval_dim_768_cosine_precision@10": 0.352752880921895,
"eval_dim_768_cosine_precision@3": 0.39820742637644047,
"eval_dim_768_cosine_precision@5": 0.3868117797695263,
"eval_dim_768_cosine_recall@1": 0.046132270416131195,
"eval_dim_768_cosine_recall@10": 0.29681183299989666,
"eval_dim_768_cosine_recall@3": 0.13453018491697852,
"eval_dim_768_cosine_recall@5": 0.20078864250336506,
"eval_runtime": 98.6751,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.3275369456141822,
"eval_steps_per_second": 0.0,
"step": 52
}
],
"logging_steps": 10,
"max_steps": 240,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 2,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 1
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}