Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add MIRACL results for Russian models #29

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 16 additions & 0 deletions paths.json
Original file line number Diff line number Diff line change
Expand Up @@ -1246,6 +1246,7 @@
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/MedrxivClusteringS2S.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/Diversity5LegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/RiaNewsRetrieval.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/MIRACLRetrieval.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/YahooAnswersTopicsClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/ContractNLIPermissiblePostAgreementPossessionLegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/OPP115PolicyChangeLegalBenchClassification.json",
Expand Down Expand Up @@ -1327,6 +1328,7 @@
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/LearnedHandsCourtsLegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/TelemarketingSalesRuleLegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/NYSJudicialEthicsLegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/MIRACLReranking.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/XNLI.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/ContractNLIPermissibleCopyLegalBenchClassification.json",
"results/sergeyzh__rubert-tiny-turbo/8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054/SCDDTrainingLegalBenchClassification.json",
Expand Down Expand Up @@ -3574,6 +3576,7 @@
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/RuSTSBenchmarkSTS.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/CyrillicTurkicLangClassification.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/RiaNewsRetrieval.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/MIRACLRetrieval.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/GeoreviewClassification.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/SensitiveTopicsClassification.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/KinopoiskClassification.json",
Expand All @@ -3589,6 +3592,7 @@
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/HeadlineClassification.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/XQuADRetrieval.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/BUCC.v2.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/MIRACLReranking.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/XNLI.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/XNLIV2.json",
"results/DeepPavlov__distilrubert-small-cased-conversational/e348066b4a7279b97138038299bddc6580a9169a/STS22.json",
Expand Down Expand Up @@ -9928,6 +9932,7 @@
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/RuSTSBenchmarkSTS.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/CyrillicTurkicLangClassification.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/RiaNewsRetrieval.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/MIRACLRetrieval.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/GeoreviewClassification.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/SensitiveTopicsClassification.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/KinopoiskClassification.json",
Expand All @@ -9942,6 +9947,7 @@
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/HeadlineClassification.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/XQuADRetrieval.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/BUCC.v2.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/MIRACLReranking.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/XNLI.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/XNLIV2.json",
"results/deepvk__USER-bge-m3/0cc6cfe48e260fb0474c753087a69369e88709ae/STS22.json",
Expand Down Expand Up @@ -11951,6 +11957,7 @@
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/RuSTSBenchmarkSTS.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/CyrillicTurkicLangClassification.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/RiaNewsRetrieval.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/MIRACLRetrieval.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/GeoreviewClassification.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/SensitiveTopicsClassification.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/KinopoiskClassification.json",
Expand All @@ -11965,6 +11972,7 @@
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/HeadlineClassification.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/XQuADRetrieval.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/BUCC.v2.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/MIRACLReranking.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/XNLI.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/XNLIV2.json",
"results/cointegrated__LaBSE-en-ru/cf0714e606d4af551e14ad69a7929cd6b0da7f7e/STS22.json",
Expand Down Expand Up @@ -12477,6 +12485,7 @@
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/RuSTSBenchmarkSTS.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/CyrillicTurkicLangClassification.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/RiaNewsRetrieval.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/MIRACLRetrieval.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/GeoreviewClassification.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/SensitiveTopicsClassification.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/KinopoiskClassification.json",
Expand All @@ -12492,6 +12501,7 @@
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/HeadlineClassification.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/XQuADRetrieval.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/BUCC.v2.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/MIRACLReranking.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/XNLI.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/XNLIV2.json",
"results/DeepPavlov__rubert-base-cased-sentence/78b5122d6365337dd4114281b0d08cd1edbb3bc8/STS22.json",
Expand Down Expand Up @@ -13662,6 +13672,7 @@
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/RuSTSBenchmarkSTS.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/CyrillicTurkicLangClassification.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/RiaNewsRetrieval.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/MIRACLRetrieval.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/GeoreviewClassification.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/SensitiveTopicsClassification.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/KinopoiskClassification.json",
Expand All @@ -13676,6 +13687,7 @@
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/HeadlineClassification.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/XQuADRetrieval.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/BUCC.v2.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/MIRACLReranking.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/XNLI.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/XNLIV2.json",
"results/sergeyzh__LaBSE-ru-turbo/1940b046c6b5e125df11722b899130329d0a46da/STS22.json",
Expand Down Expand Up @@ -13708,6 +13720,7 @@
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/RuSTSBenchmarkSTS.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/CyrillicTurkicLangClassification.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/RiaNewsRetrieval.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/MIRACLRetrieval.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/GeoreviewClassification.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/SensitiveTopicsClassification.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/KinopoiskClassification.json",
Expand All @@ -13723,6 +13736,7 @@
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/HeadlineClassification.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/XQuADRetrieval.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/BUCC.v2.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/MIRACLReranking.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/XNLI.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/XNLIV2.json",
"results/DeepPavlov__rubert-base-cased/4036cab694767a299f2b9e6492909664d9414229/STS22.json",
Expand Down Expand Up @@ -15092,6 +15106,7 @@
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/RuSTSBenchmarkSTS.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/CyrillicTurkicLangClassification.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/RiaNewsRetrieval.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/MIRACLRetrieval.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/GeoreviewClassification.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/SensitiveTopicsClassification.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/KinopoiskClassification.json",
Expand All @@ -15106,6 +15121,7 @@
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/HeadlineClassification.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/XQuADRetrieval.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/BUCC.v2.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/MIRACLReranking.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/XNLI.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/XNLIV2.json",
"results/deepvk__USER-base/436a489a2087d61aa670b3496a9915f84e46c861/STS22.json",
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,130 @@
{
"dataset_revision": "6d1962c527217f8927fca80f890f14f36b2802af",
"evaluation_time": 102.19886922836304,
"kg_co2_emissions": null,
"mteb_version": "1.12.94",
"scores": {
"dev": [
{
"MAP@1(MIRACL)": 0.03793,
"MAP@10(MIRACL)": 0.08492,
"MAP@100(MIRACL)": 0.11854,
"MAP@1000(MIRACL)": 0.11854,
"MAP@20(MIRACL)": 0.09699,
"MAP@3(MIRACL)": 0.0599,
"MAP@5(MIRACL)": 0.07087,
"NDCG@1(MIRACL)": 0.06576,
"NDCG@10(MIRACL)": 0.13094,
"NDCG@100(MIRACL)": 0.27866,
"NDCG@1000(MIRACL)": 0.27866,
"NDCG@20(MIRACL)": 0.16843,
"NDCG@3(MIRACL)": 0.08274,
"NDCG@5(MIRACL)": 0.09898,
"P@1(MIRACL)": 0.06576,
"P@10(MIRACL)": 0.04707,
"P@100(MIRACL)": 0.01953,
"P@1000(MIRACL)": 0.00195,
"P@20(MIRACL)": 0.03773,
"P@3(MIRACL)": 0.05801,
"P@5(MIRACL)": 0.05277,
"Recall@1(MIRACL)": 0.03793,
"Recall@10(MIRACL)": 0.20941,
"Recall@100(MIRACL)": 0.79952,
"Recall@1000(MIRACL)": 0.79952,
"Recall@20(MIRACL)": 0.32753,
"Recall@3(MIRACL)": 0.08533,
"Recall@5(MIRACL)": 0.12619,
"hf_subset": "ru",
"languages": [
"rus-Cyrl"
],
"main_score": 0.13094,
"nAUC_MAP@1000_diff1(MIRACL)": 0.11656879622209783,
"nAUC_MAP@1000_max(MIRACL)": -0.02184173429173281,
"nAUC_MAP@1000_std(MIRACL)": -0.0005910451991668005,
"nAUC_MAP@100_diff1(MIRACL)": 0.11656879622209783,
"nAUC_MAP@100_max(MIRACL)": -0.02184173429173281,
"nAUC_MAP@100_std(MIRACL)": -0.0005910451991668005,
"nAUC_MAP@10_diff1(MIRACL)": 0.12820268321122477,
"nAUC_MAP@10_max(MIRACL)": -0.006007170516302484,
"nAUC_MAP@10_std(MIRACL)": 0.004887023887105919,
"nAUC_MAP@1_diff1(MIRACL)": 0.19979024924352953,
"nAUC_MAP@1_max(MIRACL)": 0.0965067328936865,
"nAUC_MAP@1_std(MIRACL)": -0.01469295152548763,
"nAUC_MAP@20_diff1(MIRACL)": 0.11943138095364866,
"nAUC_MAP@20_max(MIRACL)": -0.014742898115901397,
"nAUC_MAP@20_std(MIRACL)": 0.007627922730200203,
"nAUC_MAP@3_diff1(MIRACL)": 0.16247267806292065,
"nAUC_MAP@3_max(MIRACL)": 0.01916771582088975,
"nAUC_MAP@3_std(MIRACL)": -0.024768207978978725,
"nAUC_MAP@5_diff1(MIRACL)": 0.13153704499454139,
"nAUC_MAP@5_max(MIRACL)": 0.007096539434435867,
"nAUC_MAP@5_std(MIRACL)": -0.013659018365901245,
"nAUC_NDCG@1000_diff1(MIRACL)": 0.09046593862073116,
"nAUC_NDCG@1000_max(MIRACL)": -0.049656945308565785,
"nAUC_NDCG@1000_std(MIRACL)": -0.02852729085649775,
"nAUC_NDCG@100_diff1(MIRACL)": 0.09046593862073116,
"nAUC_NDCG@100_max(MIRACL)": -0.049656945308565785,
"nAUC_NDCG@100_std(MIRACL)": -0.02852729085649775,
"nAUC_NDCG@10_diff1(MIRACL)": 0.10077472820623631,
"nAUC_NDCG@10_max(MIRACL)": -0.033319860687037434,
"nAUC_NDCG@10_std(MIRACL)": 0.008223662807163275,
"nAUC_NDCG@1_diff1(MIRACL)": 0.151186819507912,
"nAUC_NDCG@1_max(MIRACL)": 0.11537026630871994,
"nAUC_NDCG@1_std(MIRACL)": -0.045578082017163145,
"nAUC_NDCG@20_diff1(MIRACL)": 0.08640831332839452,
"nAUC_NDCG@20_max(MIRACL)": -0.05269863130012071,
"nAUC_NDCG@20_std(MIRACL)": 0.007783868824801839,
"nAUC_NDCG@3_diff1(MIRACL)": 0.13178318008309772,
"nAUC_NDCG@3_max(MIRACL)": 0.0035297506848497,
"nAUC_NDCG@3_std(MIRACL)": -0.042422835970525714,
"nAUC_NDCG@5_diff1(MIRACL)": 0.10348566598107344,
"nAUC_NDCG@5_max(MIRACL)": -0.015154481875360658,
"nAUC_NDCG@5_std(MIRACL)": -0.02018522684348813,
"nAUC_P@1000_diff1(MIRACL)": 0.006436408505254566,
"nAUC_P@1000_max(MIRACL)": -0.062365784452251265,
"nAUC_P@1000_std(MIRACL)": -0.06679081786133326,
"nAUC_P@100_diff1(MIRACL)": 0.006436408505254932,
"nAUC_P@100_max(MIRACL)": -0.06236578445225068,
"nAUC_P@100_std(MIRACL)": -0.06679081786133294,
"nAUC_P@10_diff1(MIRACL)": 0.035924513017525805,
"nAUC_P@10_max(MIRACL)": -0.07407327390595522,
"nAUC_P@10_std(MIRACL)": 0.011824346308663887,
"nAUC_P@1_diff1(MIRACL)": 0.151186819507912,
"nAUC_P@1_max(MIRACL)": 0.11537026630871994,
"nAUC_P@1_std(MIRACL)": -0.045578082017163145,
"nAUC_P@20_diff1(MIRACL)": 0.020405546456346138,
"nAUC_P@20_max(MIRACL)": -0.09600408910657676,
"nAUC_P@20_std(MIRACL)": -0.0001021731695539199,
"nAUC_P@3_diff1(MIRACL)": 0.08187396234458519,
"nAUC_P@3_max(MIRACL)": -0.02981991700564444,
"nAUC_P@3_std(MIRACL)": -0.04315477063398759,
"nAUC_P@5_diff1(MIRACL)": 0.029326475776068565,
"nAUC_P@5_max(MIRACL)": -0.05538591644280579,
"nAUC_P@5_std(MIRACL)": -0.013627413052371293,
"nAUC_Recall@1000_diff1(MIRACL)": 0.0626568052254435,
"nAUC_Recall@1000_max(MIRACL)": -0.056351555553082765,
"nAUC_Recall@1000_std(MIRACL)": -0.07720527712702241,
"nAUC_Recall@100_diff1(MIRACL)": 0.0626568052254435,
"nAUC_Recall@100_max(MIRACL)": -0.056351555553082765,
"nAUC_Recall@100_std(MIRACL)": -0.07720527712702241,
"nAUC_Recall@10_diff1(MIRACL)": 0.0699596207061801,
"nAUC_Recall@10_max(MIRACL)": -0.06623123931077808,
"nAUC_Recall@10_std(MIRACL)": 0.04314390563870134,
"nAUC_Recall@1_diff1(MIRACL)": 0.19979024924352953,
"nAUC_Recall@1_max(MIRACL)": 0.0965067328936865,
"nAUC_Recall@1_std(MIRACL)": -0.01469295152548763,
"nAUC_Recall@20_diff1(MIRACL)": 0.04151985357457182,
"nAUC_Recall@20_max(MIRACL)": -0.09346206581673573,
"nAUC_Recall@20_std(MIRACL)": 0.03867752916801929,
"nAUC_Recall@3_diff1(MIRACL)": 0.15002227895926992,
"nAUC_Recall@3_max(MIRACL)": -0.03085604524638985,
"nAUC_Recall@3_std(MIRACL)": -0.04078077585553242,
"nAUC_Recall@5_diff1(MIRACL)": 0.08035497411159716,
"nAUC_Recall@5_max(MIRACL)": -0.053504090706605265,
"nAUC_Recall@5_std(MIRACL)": -0.009017940713406399
}
]
},
"task_name": "MIRACLReranking"
}
Loading
Loading