smikulas's picture
Upload folder using huggingface_hub
4c1bea0 verified
{
"best_global_step": 72,
"best_metric": 0.7275517192718437,
"best_model_checkpoint": "MNLP_M3_document_encoder_sciqa/checkpoint-72",
"epoch": 3.8135593220338984,
"eval_steps": 500,
"global_step": 72,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.5423728813559322,
"grad_norm": 164.72093200683594,
"learning_rate": 1.9987954562051724e-05,
"loss": 22.4049,
"step": 10
},
{
"epoch": 1.0,
"eval_dim_128_cosine_accuracy@1": 0.5452812202097236,
"eval_dim_128_cosine_accuracy@10": 0.8760724499523356,
"eval_dim_128_cosine_accuracy@3": 0.7416587225929456,
"eval_dim_128_cosine_accuracy@5": 0.8074356530028599,
"eval_dim_128_cosine_map@100": 0.6605612754102786,
"eval_dim_128_cosine_mrr@10": 0.6559349796480402,
"eval_dim_128_cosine_ndcg@10": 0.7092688022688834,
"eval_dim_128_cosine_precision@1": 0.5452812202097236,
"eval_dim_128_cosine_precision@10": 0.08760724499523356,
"eval_dim_128_cosine_precision@3": 0.24721957419764853,
"eval_dim_128_cosine_precision@5": 0.161487130600572,
"eval_dim_128_cosine_recall@1": 0.5452812202097236,
"eval_dim_128_cosine_recall@10": 0.8760724499523356,
"eval_dim_128_cosine_recall@3": 0.7416587225929456,
"eval_dim_128_cosine_recall@5": 0.8074356530028599,
"eval_dim_192_cosine_accuracy@1": 0.5624404194470924,
"eval_dim_192_cosine_accuracy@10": 0.8932316491897044,
"eval_dim_192_cosine_accuracy@3": 0.7597712106768351,
"eval_dim_192_cosine_accuracy@5": 0.8188751191611058,
"eval_dim_192_cosine_map@100": 0.677245219852975,
"eval_dim_192_cosine_mrr@10": 0.6730234388003697,
"eval_dim_192_cosine_ndcg@10": 0.7262712999939527,
"eval_dim_192_cosine_precision@1": 0.5624404194470924,
"eval_dim_192_cosine_precision@10": 0.08932316491897044,
"eval_dim_192_cosine_precision@3": 0.25325707022561167,
"eval_dim_192_cosine_precision@5": 0.16377502383222117,
"eval_dim_192_cosine_recall@1": 0.5624404194470924,
"eval_dim_192_cosine_recall@10": 0.8932316491897044,
"eval_dim_192_cosine_recall@3": 0.7597712106768351,
"eval_dim_192_cosine_recall@5": 0.8188751191611058,
"eval_dim_256_cosine_accuracy@1": 0.5653002859866539,
"eval_dim_256_cosine_accuracy@10": 0.8960915157292659,
"eval_dim_256_cosine_accuracy@3": 0.7683508102955195,
"eval_dim_256_cosine_accuracy@5": 0.8236415633937083,
"eval_dim_256_cosine_map@100": 0.6831583296339104,
"eval_dim_256_cosine_mrr@10": 0.6786784844220503,
"eval_dim_256_cosine_ndcg@10": 0.7314611486548883,
"eval_dim_256_cosine_precision@1": 0.5653002859866539,
"eval_dim_256_cosine_precision@10": 0.08960915157292659,
"eval_dim_256_cosine_precision@3": 0.25611693676517316,
"eval_dim_256_cosine_precision@5": 0.16472831267874166,
"eval_dim_256_cosine_recall@1": 0.5653002859866539,
"eval_dim_256_cosine_recall@10": 0.8960915157292659,
"eval_dim_256_cosine_recall@3": 0.7683508102955195,
"eval_dim_256_cosine_recall@5": 0.8236415633937083,
"eval_dim_384_cosine_accuracy@1": 0.5786463298379408,
"eval_dim_384_cosine_accuracy@10": 0.9075309818875119,
"eval_dim_384_cosine_accuracy@3": 0.776930409914204,
"eval_dim_384_cosine_accuracy@5": 0.8417540514775977,
"eval_dim_384_cosine_map@100": 0.6932934943306605,
"eval_dim_384_cosine_mrr@10": 0.6894563227261042,
"eval_dim_384_cosine_ndcg@10": 0.7423737824827953,
"eval_dim_384_cosine_precision@1": 0.5786463298379408,
"eval_dim_384_cosine_precision@10": 0.0907530981887512,
"eval_dim_384_cosine_precision@3": 0.2589768033047346,
"eval_dim_384_cosine_precision@5": 0.16835081029551957,
"eval_dim_384_cosine_recall@1": 0.5786463298379408,
"eval_dim_384_cosine_recall@10": 0.9075309818875119,
"eval_dim_384_cosine_recall@3": 0.776930409914204,
"eval_dim_384_cosine_recall@5": 0.8417540514775977,
"eval_dim_64_cosine_accuracy@1": 0.49285033365109626,
"eval_dim_64_cosine_accuracy@10": 0.8274547187797903,
"eval_dim_64_cosine_accuracy@3": 0.684461391801716,
"eval_dim_64_cosine_accuracy@5": 0.7578646329837941,
"eval_dim_64_cosine_map@100": 0.6088952628032813,
"eval_dim_64_cosine_mrr@10": 0.6032237807738285,
"eval_dim_64_cosine_ndcg@10": 0.6575406372744073,
"eval_dim_64_cosine_precision@1": 0.49285033365109626,
"eval_dim_64_cosine_precision@10": 0.08274547187797902,
"eval_dim_64_cosine_precision@3": 0.2281537972672386,
"eval_dim_64_cosine_precision@5": 0.1515729265967588,
"eval_dim_64_cosine_recall@1": 0.49285033365109626,
"eval_dim_64_cosine_recall@10": 0.8274547187797903,
"eval_dim_64_cosine_recall@3": 0.684461391801716,
"eval_dim_64_cosine_recall@5": 0.7578646329837941,
"eval_dim_96_cosine_accuracy@1": 0.5214489990467112,
"eval_dim_96_cosine_accuracy@10": 0.8636796949475691,
"eval_dim_96_cosine_accuracy@3": 0.7264061010486177,
"eval_dim_96_cosine_accuracy@5": 0.7893231649189705,
"eval_dim_96_cosine_map@100": 0.6418431352074736,
"eval_dim_96_cosine_mrr@10": 0.6369528046363133,
"eval_dim_96_cosine_ndcg@10": 0.6919097155042885,
"eval_dim_96_cosine_precision@1": 0.5214489990467112,
"eval_dim_96_cosine_precision@10": 0.0863679694947569,
"eval_dim_96_cosine_precision@3": 0.2421353670162059,
"eval_dim_96_cosine_precision@5": 0.15786463298379408,
"eval_dim_96_cosine_recall@1": 0.5214489990467112,
"eval_dim_96_cosine_recall@10": 0.8636796949475691,
"eval_dim_96_cosine_recall@3": 0.7264061010486177,
"eval_dim_96_cosine_recall@5": 0.7893231649189705,
"eval_runtime": 116.4269,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.6575406372744073,
"eval_steps_per_second": 0.0,
"step": 19
},
{
"epoch": 1.0542372881355933,
"grad_norm": 107.04779815673828,
"learning_rate": 1.8577286100002723e-05,
"loss": 16.6616,
"step": 20
},
{
"epoch": 1.5966101694915253,
"grad_norm": 97.63832092285156,
"learning_rate": 1.5141027441932217e-05,
"loss": 16.8367,
"step": 30
},
{
"epoch": 2.0,
"eval_dim_128_cosine_accuracy@1": 0.567206863679695,
"eval_dim_128_cosine_accuracy@10": 0.886558627264061,
"eval_dim_128_cosine_accuracy@3": 0.7607244995233555,
"eval_dim_128_cosine_accuracy@5": 0.8236415633937083,
"eval_dim_128_cosine_map@100": 0.6790430112153837,
"eval_dim_128_cosine_mrr@10": 0.6746886679679823,
"eval_dim_128_cosine_ndcg@10": 0.7260517487265687,
"eval_dim_128_cosine_precision@1": 0.567206863679695,
"eval_dim_128_cosine_precision@10": 0.0886558627264061,
"eval_dim_128_cosine_precision@3": 0.25357483317445184,
"eval_dim_128_cosine_precision@5": 0.16472831267874166,
"eval_dim_128_cosine_recall@1": 0.567206863679695,
"eval_dim_128_cosine_recall@10": 0.886558627264061,
"eval_dim_128_cosine_recall@3": 0.7607244995233555,
"eval_dim_128_cosine_recall@5": 0.8236415633937083,
"eval_dim_192_cosine_accuracy@1": 0.5805529075309819,
"eval_dim_192_cosine_accuracy@10": 0.9008579599618685,
"eval_dim_192_cosine_accuracy@3": 0.782650142993327,
"eval_dim_192_cosine_accuracy@5": 0.8322211630123928,
"eval_dim_192_cosine_map@100": 0.6964841260809953,
"eval_dim_192_cosine_mrr@10": 0.6923562879234952,
"eval_dim_192_cosine_ndcg@10": 0.7430712975035773,
"eval_dim_192_cosine_precision@1": 0.5805529075309819,
"eval_dim_192_cosine_precision@10": 0.09008579599618685,
"eval_dim_192_cosine_precision@3": 0.26088338099777564,
"eval_dim_192_cosine_precision@5": 0.16644423260247856,
"eval_dim_192_cosine_recall@1": 0.5805529075309819,
"eval_dim_192_cosine_recall@10": 0.9008579599618685,
"eval_dim_192_cosine_recall@3": 0.782650142993327,
"eval_dim_192_cosine_recall@5": 0.8322211630123928,
"eval_dim_256_cosine_accuracy@1": 0.5919923736892279,
"eval_dim_256_cosine_accuracy@10": 0.9142040038131554,
"eval_dim_256_cosine_accuracy@3": 0.7902764537654909,
"eval_dim_256_cosine_accuracy@5": 0.8360343183984748,
"eval_dim_256_cosine_map@100": 0.7038093293311698,
"eval_dim_256_cosine_mrr@10": 0.700305279404422,
"eval_dim_256_cosine_ndcg@10": 0.7520267351833514,
"eval_dim_256_cosine_precision@1": 0.5919923736892279,
"eval_dim_256_cosine_precision@10": 0.09142040038131555,
"eval_dim_256_cosine_precision@3": 0.26342548458849696,
"eval_dim_256_cosine_precision@5": 0.16720686367969492,
"eval_dim_256_cosine_recall@1": 0.5919923736892279,
"eval_dim_256_cosine_recall@10": 0.9142040038131554,
"eval_dim_256_cosine_recall@3": 0.7902764537654909,
"eval_dim_256_cosine_recall@5": 0.8360343183984748,
"eval_dim_384_cosine_accuracy@1": 0.6015252621544328,
"eval_dim_384_cosine_accuracy@10": 0.9199237368922784,
"eval_dim_384_cosine_accuracy@3": 0.7959961868446139,
"eval_dim_384_cosine_accuracy@5": 0.8531935176358436,
"eval_dim_384_cosine_map@100": 0.713601684515785,
"eval_dim_384_cosine_mrr@10": 0.7104082497314151,
"eval_dim_384_cosine_ndcg@10": 0.761241503632434,
"eval_dim_384_cosine_precision@1": 0.6015252621544328,
"eval_dim_384_cosine_precision@10": 0.09199237368922783,
"eval_dim_384_cosine_precision@3": 0.26533206228153794,
"eval_dim_384_cosine_precision@5": 0.17063870352716873,
"eval_dim_384_cosine_recall@1": 0.6015252621544328,
"eval_dim_384_cosine_recall@10": 0.9199237368922784,
"eval_dim_384_cosine_recall@3": 0.7959961868446139,
"eval_dim_384_cosine_recall@5": 0.8531935176358436,
"eval_dim_64_cosine_accuracy@1": 0.5138226882745471,
"eval_dim_64_cosine_accuracy@10": 0.8341277407054337,
"eval_dim_64_cosine_accuracy@3": 0.7016205910390848,
"eval_dim_64_cosine_accuracy@5": 0.7645376549094376,
"eval_dim_64_cosine_map@100": 0.6242158272303533,
"eval_dim_64_cosine_mrr@10": 0.618670464690484,
"eval_dim_64_cosine_ndcg@10": 0.6707950308444217,
"eval_dim_64_cosine_precision@1": 0.5138226882745471,
"eval_dim_64_cosine_precision@10": 0.08341277407054337,
"eval_dim_64_cosine_precision@3": 0.2338735303463616,
"eval_dim_64_cosine_precision@5": 0.1529075309818875,
"eval_dim_64_cosine_recall@1": 0.5138226882745471,
"eval_dim_64_cosine_recall@10": 0.8341277407054337,
"eval_dim_64_cosine_recall@3": 0.7016205910390848,
"eval_dim_64_cosine_recall@5": 0.7645376549094376,
"eval_dim_96_cosine_accuracy@1": 0.5471877979027645,
"eval_dim_96_cosine_accuracy@10": 0.8722592945662536,
"eval_dim_96_cosine_accuracy@3": 0.7407054337464252,
"eval_dim_96_cosine_accuracy@5": 0.8017159199237369,
"eval_dim_96_cosine_map@100": 0.6622003643008398,
"eval_dim_96_cosine_mrr@10": 0.6576811627097615,
"eval_dim_96_cosine_ndcg@10": 0.7097194683573752,
"eval_dim_96_cosine_precision@1": 0.5471877979027645,
"eval_dim_96_cosine_precision@10": 0.08722592945662536,
"eval_dim_96_cosine_precision@3": 0.2469018112488084,
"eval_dim_96_cosine_precision@5": 0.16034318398474737,
"eval_dim_96_cosine_recall@1": 0.5471877979027645,
"eval_dim_96_cosine_recall@10": 0.8722592945662536,
"eval_dim_96_cosine_recall@3": 0.7407054337464252,
"eval_dim_96_cosine_recall@5": 0.8017159199237369,
"eval_runtime": 119.8934,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.6707950308444217,
"eval_steps_per_second": 0.0,
"step": 38
},
{
"epoch": 2.1084745762711865,
"grad_norm": 113.89473724365234,
"learning_rate": 1.0490676743274181e-05,
"loss": 12.8169,
"step": 40
},
{
"epoch": 2.6508474576271186,
"grad_norm": 81.27326965332031,
"learning_rate": 5.724449065697182e-06,
"loss": 13.7826,
"step": 50
},
{
"epoch": 3.0,
"eval_dim_128_cosine_accuracy@1": 0.567206863679695,
"eval_dim_128_cosine_accuracy@10": 0.8903717826501429,
"eval_dim_128_cosine_accuracy@3": 0.7616777883698761,
"eval_dim_128_cosine_accuracy@5": 0.8265014299332698,
"eval_dim_128_cosine_map@100": 0.6794753898354032,
"eval_dim_128_cosine_mrr@10": 0.6752920392815543,
"eval_dim_128_cosine_ndcg@10": 0.7273531110418706,
"eval_dim_128_cosine_precision@1": 0.567206863679695,
"eval_dim_128_cosine_precision@10": 0.08903717826501431,
"eval_dim_128_cosine_precision@3": 0.253892596123292,
"eval_dim_128_cosine_precision@5": 0.16530028598665394,
"eval_dim_128_cosine_recall@1": 0.567206863679695,
"eval_dim_128_cosine_recall@10": 0.8903717826501429,
"eval_dim_128_cosine_recall@3": 0.7616777883698761,
"eval_dim_128_cosine_recall@5": 0.8265014299332698,
"eval_dim_192_cosine_accuracy@1": 0.5910390848427073,
"eval_dim_192_cosine_accuracy@10": 0.9046711153479504,
"eval_dim_192_cosine_accuracy@3": 0.7778836987607245,
"eval_dim_192_cosine_accuracy@5": 0.8360343183984748,
"eval_dim_192_cosine_map@100": 0.7014228144337117,
"eval_dim_192_cosine_mrr@10": 0.6975449029309853,
"eval_dim_192_cosine_ndcg@10": 0.7477240665900656,
"eval_dim_192_cosine_precision@1": 0.5910390848427073,
"eval_dim_192_cosine_precision@10": 0.09046711153479504,
"eval_dim_192_cosine_precision@3": 0.25929456625357483,
"eval_dim_192_cosine_precision@5": 0.16720686367969495,
"eval_dim_192_cosine_recall@1": 0.5910390848427073,
"eval_dim_192_cosine_recall@10": 0.9046711153479504,
"eval_dim_192_cosine_recall@3": 0.7778836987607245,
"eval_dim_192_cosine_recall@5": 0.8360343183984748,
"eval_dim_256_cosine_accuracy@1": 0.5948522402287894,
"eval_dim_256_cosine_accuracy@10": 0.9151572926596759,
"eval_dim_256_cosine_accuracy@3": 0.792183031458532,
"eval_dim_256_cosine_accuracy@5": 0.8398474737845567,
"eval_dim_256_cosine_map@100": 0.7070932589939358,
"eval_dim_256_cosine_mrr@10": 0.7035797509343749,
"eval_dim_256_cosine_ndcg@10": 0.7548435122429773,
"eval_dim_256_cosine_precision@1": 0.5948522402287894,
"eval_dim_256_cosine_precision@10": 0.09151572926596759,
"eval_dim_256_cosine_precision@3": 0.2640610104861773,
"eval_dim_256_cosine_precision@5": 0.16796949475691134,
"eval_dim_256_cosine_recall@1": 0.5948522402287894,
"eval_dim_256_cosine_recall@10": 0.9151572926596759,
"eval_dim_256_cosine_recall@3": 0.792183031458532,
"eval_dim_256_cosine_recall@5": 0.8398474737845567,
"eval_dim_384_cosine_accuracy@1": 0.6101048617731173,
"eval_dim_384_cosine_accuracy@10": 0.9256434699714013,
"eval_dim_384_cosine_accuracy@3": 0.8007626310772163,
"eval_dim_384_cosine_accuracy@5": 0.8541468064823642,
"eval_dim_384_cosine_map@100": 0.7197084605820631,
"eval_dim_384_cosine_mrr@10": 0.7170116664396936,
"eval_dim_384_cosine_ndcg@10": 0.7675175612283535,
"eval_dim_384_cosine_precision@1": 0.6101048617731173,
"eval_dim_384_cosine_precision@10": 0.09256434699714014,
"eval_dim_384_cosine_precision@3": 0.2669208770257388,
"eval_dim_384_cosine_precision@5": 0.17082936129647283,
"eval_dim_384_cosine_recall@1": 0.6101048617731173,
"eval_dim_384_cosine_recall@10": 0.9256434699714013,
"eval_dim_384_cosine_recall@3": 0.8007626310772163,
"eval_dim_384_cosine_recall@5": 0.8541468064823642,
"eval_dim_64_cosine_accuracy@1": 0.5166825548141086,
"eval_dim_64_cosine_accuracy@10": 0.8369876072449952,
"eval_dim_64_cosine_accuracy@3": 0.7054337464251669,
"eval_dim_64_cosine_accuracy@5": 0.7673975214489991,
"eval_dim_64_cosine_map@100": 0.629350282837756,
"eval_dim_64_cosine_mrr@10": 0.6240088822309986,
"eval_dim_64_cosine_ndcg@10": 0.6755921916053389,
"eval_dim_64_cosine_precision@1": 0.5166825548141086,
"eval_dim_64_cosine_precision@10": 0.08369876072449953,
"eval_dim_64_cosine_precision@3": 0.23514458214172226,
"eval_dim_64_cosine_precision@5": 0.1534795042897998,
"eval_dim_64_cosine_recall@1": 0.5166825548141086,
"eval_dim_64_cosine_recall@10": 0.8369876072449952,
"eval_dim_64_cosine_recall@3": 0.7054337464251669,
"eval_dim_64_cosine_recall@5": 0.7673975214489991,
"eval_dim_96_cosine_accuracy@1": 0.5529075309818875,
"eval_dim_96_cosine_accuracy@10": 0.8741658722592945,
"eval_dim_96_cosine_accuracy@3": 0.7416587225929456,
"eval_dim_96_cosine_accuracy@5": 0.8093422306959008,
"eval_dim_96_cosine_map@100": 0.6652525185575742,
"eval_dim_96_cosine_mrr@10": 0.6608247461679306,
"eval_dim_96_cosine_ndcg@10": 0.7125237648315317,
"eval_dim_96_cosine_precision@1": 0.5529075309818875,
"eval_dim_96_cosine_precision@10": 0.08741658722592945,
"eval_dim_96_cosine_precision@3": 0.24721957419764853,
"eval_dim_96_cosine_precision@5": 0.1618684461391802,
"eval_dim_96_cosine_recall@1": 0.5529075309818875,
"eval_dim_96_cosine_recall@10": 0.8741658722592945,
"eval_dim_96_cosine_recall@3": 0.7416587225929456,
"eval_dim_96_cosine_recall@5": 0.8093422306959008,
"eval_runtime": 120.2085,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.6755921916053389,
"eval_steps_per_second": 0.0,
"step": 57
},
{
"epoch": 3.1627118644067798,
"grad_norm": 102.55581665039062,
"learning_rate": 1.967924685193552e-06,
"loss": 12.4455,
"step": 60
},
{
"epoch": 3.705084745762712,
"grad_norm": 84.57442474365234,
"learning_rate": 1.0823490035218986e-07,
"loss": 12.2968,
"step": 70
},
{
"epoch": 3.8135593220338984,
"eval_dim_128_cosine_accuracy@1": 0.5662535748331744,
"eval_dim_128_cosine_accuracy@10": 0.8913250714966635,
"eval_dim_128_cosine_accuracy@3": 0.7626310772163966,
"eval_dim_128_cosine_accuracy@5": 0.8265014299332698,
"eval_dim_128_cosine_map@100": 0.6793502491099088,
"eval_dim_128_cosine_mrr@10": 0.6752375656331816,
"eval_dim_128_cosine_ndcg@10": 0.7275517192718437,
"eval_dim_128_cosine_precision@1": 0.5662535748331744,
"eval_dim_128_cosine_precision@10": 0.08913250714966635,
"eval_dim_128_cosine_precision@3": 0.25421035907213213,
"eval_dim_128_cosine_precision@5": 0.16530028598665394,
"eval_dim_128_cosine_recall@1": 0.5662535748331744,
"eval_dim_128_cosine_recall@10": 0.8913250714966635,
"eval_dim_128_cosine_recall@3": 0.7626310772163966,
"eval_dim_128_cosine_recall@5": 0.8265014299332698,
"eval_dim_192_cosine_accuracy@1": 0.5891325071496664,
"eval_dim_192_cosine_accuracy@10": 0.90371782650143,
"eval_dim_192_cosine_accuracy@3": 0.778836987607245,
"eval_dim_192_cosine_accuracy@5": 0.8331744518589133,
"eval_dim_192_cosine_map@100": 0.7004357679049269,
"eval_dim_192_cosine_mrr@10": 0.6964694266648511,
"eval_dim_192_cosine_ndcg@10": 0.7467179313530818,
"eval_dim_192_cosine_precision@1": 0.5891325071496664,
"eval_dim_192_cosine_precision@10": 0.090371782650143,
"eval_dim_192_cosine_precision@3": 0.259612329202415,
"eval_dim_192_cosine_precision@5": 0.16663489037178267,
"eval_dim_192_cosine_recall@1": 0.5891325071496664,
"eval_dim_192_cosine_recall@10": 0.90371782650143,
"eval_dim_192_cosine_recall@3": 0.778836987607245,
"eval_dim_192_cosine_recall@5": 0.8331744518589133,
"eval_dim_256_cosine_accuracy@1": 0.5977121067683508,
"eval_dim_256_cosine_accuracy@10": 0.9151572926596759,
"eval_dim_256_cosine_accuracy@3": 0.7912297426120114,
"eval_dim_256_cosine_accuracy@5": 0.8398474737845567,
"eval_dim_256_cosine_map@100": 0.7084736712852033,
"eval_dim_256_cosine_mrr@10": 0.7049529408204341,
"eval_dim_256_cosine_ndcg@10": 0.7558547240171754,
"eval_dim_256_cosine_precision@1": 0.5977121067683508,
"eval_dim_256_cosine_precision@10": 0.09151572926596759,
"eval_dim_256_cosine_precision@3": 0.26374324753733713,
"eval_dim_256_cosine_precision@5": 0.16796949475691134,
"eval_dim_256_cosine_recall@1": 0.5977121067683508,
"eval_dim_256_cosine_recall@10": 0.9151572926596759,
"eval_dim_256_cosine_recall@3": 0.7912297426120114,
"eval_dim_256_cosine_recall@5": 0.8398474737845567,
"eval_dim_384_cosine_accuracy@1": 0.6120114394661582,
"eval_dim_384_cosine_accuracy@10": 0.9275500476644424,
"eval_dim_384_cosine_accuracy@3": 0.8017159199237369,
"eval_dim_384_cosine_accuracy@5": 0.8541468064823642,
"eval_dim_384_cosine_map@100": 0.7210073638258574,
"eval_dim_384_cosine_mrr@10": 0.7184669450875366,
"eval_dim_384_cosine_ndcg@10": 0.7690377395004954,
"eval_dim_384_cosine_precision@1": 0.6120114394661582,
"eval_dim_384_cosine_precision@10": 0.09275500476644424,
"eval_dim_384_cosine_precision@3": 0.267238639974579,
"eval_dim_384_cosine_precision@5": 0.17082936129647283,
"eval_dim_384_cosine_recall@1": 0.6120114394661582,
"eval_dim_384_cosine_recall@10": 0.9275500476644424,
"eval_dim_384_cosine_recall@3": 0.8017159199237369,
"eval_dim_384_cosine_recall@5": 0.8541468064823642,
"eval_dim_64_cosine_accuracy@1": 0.5166825548141086,
"eval_dim_64_cosine_accuracy@10": 0.8369876072449952,
"eval_dim_64_cosine_accuracy@3": 0.7044804575786463,
"eval_dim_64_cosine_accuracy@5": 0.7683508102955195,
"eval_dim_64_cosine_map@100": 0.6292715088820261,
"eval_dim_64_cosine_mrr@10": 0.6239059875618503,
"eval_dim_64_cosine_ndcg@10": 0.6755211859192654,
"eval_dim_64_cosine_precision@1": 0.5166825548141086,
"eval_dim_64_cosine_precision@10": 0.08369876072449953,
"eval_dim_64_cosine_precision@3": 0.2348268191928821,
"eval_dim_64_cosine_precision@5": 0.1536701620591039,
"eval_dim_64_cosine_recall@1": 0.5166825548141086,
"eval_dim_64_cosine_recall@10": 0.8369876072449952,
"eval_dim_64_cosine_recall@3": 0.7044804575786463,
"eval_dim_64_cosine_recall@5": 0.7683508102955195,
"eval_dim_96_cosine_accuracy@1": 0.551954242135367,
"eval_dim_96_cosine_accuracy@10": 0.8732125834127741,
"eval_dim_96_cosine_accuracy@3": 0.7416587225929456,
"eval_dim_96_cosine_accuracy@5": 0.8093422306959008,
"eval_dim_96_cosine_map@100": 0.6648689218069684,
"eval_dim_96_cosine_mrr@10": 0.660333348464903,
"eval_dim_96_cosine_ndcg@10": 0.7119774118711802,
"eval_dim_96_cosine_precision@1": 0.551954242135367,
"eval_dim_96_cosine_precision@10": 0.08732125834127741,
"eval_dim_96_cosine_precision@3": 0.24721957419764853,
"eval_dim_96_cosine_precision@5": 0.1618684461391802,
"eval_dim_96_cosine_recall@1": 0.551954242135367,
"eval_dim_96_cosine_recall@10": 0.8732125834127741,
"eval_dim_96_cosine_recall@3": 0.7416587225929456,
"eval_dim_96_cosine_recall@5": 0.8093422306959008,
"eval_runtime": 122.4656,
"eval_samples_per_second": 0.0,
"eval_sequential_score": 0.6755211859192654,
"eval_steps_per_second": 0.0,
"step": 72
}
],
"logging_steps": 10,
"max_steps": 72,
"num_input_tokens_seen": 0,
"num_train_epochs": 4,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}