From e5fb89728547ae5d7aca0b617ba5acae74cd1b18 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:44:07 +0200 Subject: [PATCH 01/15] Remove "mteb_version": "test". Just assume that version number is unknown. --- .../no_revision_available/LEMBNarrativeQARetrieval.json | 1 - .../no_revision_available/LEMBNeedleRetrieval.json | 1 - .../no_revision_available/LEMBPasskeyRetrieval.json | 1 - .../no_revision_available/LEMBQMSumRetrieval.json | 1 - .../no_revision_available/LEMBSummScreenFDRetrieval.json | 1 - .../no_revision_available/LEMBWikimQARetrieval.json | 1 - .../no_revision_available/AlloProfClusteringP2P.json | 1 - .../no_revision_available/AlloProfClusteringS2S.json | 1 - .../voyage-law-2/no_revision_available/AlloprofReranking.json | 1 - .../voyage-law-2/no_revision_available/AlloprofRetrieval.json | 1 - .../no_revision_available/AmazonReviewsClassification.json | 1 - results/voyage-law-2/no_revision_available/BSARDRetrieval.json | 1 - results/voyage-law-2/no_revision_available/HALClusteringS2S.json | 1 - .../no_revision_available/LEMBNarrativeQARetrieval.json | 1 - .../voyage-law-2/no_revision_available/LEMBNeedleRetrieval.json | 1 - .../voyage-law-2/no_revision_available/LEMBPasskeyRetrieval.json | 1 - .../voyage-law-2/no_revision_available/LEMBQMSumRetrieval.json | 1 - .../no_revision_available/LEMBSummScreenFDRetrieval.json | 1 - .../voyage-law-2/no_revision_available/LEMBWikimQARetrieval.json | 1 - .../voyage-law-2/no_revision_available/MLSUMClusteringP2P.json | 1 - .../voyage-law-2/no_revision_available/MLSUMClusteringS2S.json | 1 - .../no_revision_available/MTOPDomainClassification.json | 1 - .../no_revision_available/MTOPIntentClassification.json | 1 - .../no_revision_available/MasakhaNEWSClassification.json | 1 - .../no_revision_available/MasakhaNEWSClusteringP2P.json | 1 - .../no_revision_available/MasakhaNEWSClusteringS2S.json | 1 - .../no_revision_available/MassiveIntentClassification.json | 1 - .../no_revision_available/MassiveScenarioClassification.json | 1 - results/voyage-law-2/no_revision_available/MintakaRetrieval.json | 1 - results/voyage-law-2/no_revision_available/OpusparcusPC.json | 1 - .../no_revision_available/PawsXPairClassification.json | 1 - results/voyage-law-2/no_revision_available/SICKFr.json | 1 - results/voyage-law-2/no_revision_available/STS22.json | 1 - .../no_revision_available/STSBenchmarkMultilingualSTS.json | 1 - results/voyage-law-2/no_revision_available/SummEvalFr.json | 1 - results/voyage-law-2/no_revision_available/SyntecReranking.json | 1 - results/voyage-law-2/no_revision_available/SyntecRetrieval.json | 1 - results/voyage-law-2/no_revision_available/XPQARetrieval.json | 1 - .../no_revision_available/AlloProfClusteringP2P.json | 1 - .../no_revision_available/AlloProfClusteringS2S.json | 1 - .../no_revision_available/AlloprofReranking.json | 1 - .../no_revision_available/AlloprofRetrieval.json | 1 - .../no_revision_available/AmazonReviewsClassification.json | 1 - .../no_revision_available/BSARDRetrieval.json | 1 - .../no_revision_available/HALClusteringS2S.json | 1 - .../no_revision_available/LEMBNarrativeQARetrieval.json | 1 - .../no_revision_available/LEMBNeedleRetrieval.json | 1 - .../no_revision_available/LEMBPasskeyRetrieval.json | 1 - .../no_revision_available/LEMBQMSumRetrieval.json | 1 - .../no_revision_available/LEMBSummScreenFDRetrieval.json | 1 - .../no_revision_available/LEMBWikimQARetrieval.json | 1 - .../no_revision_available/MLSUMClusteringP2P.json | 1 - .../no_revision_available/MLSUMClusteringS2S.json | 1 - .../no_revision_available/MTOPDomainClassification.json | 1 - .../no_revision_available/MTOPIntentClassification.json | 1 - .../no_revision_available/MasakhaNEWSClassification.json | 1 - .../no_revision_available/MasakhaNEWSClusteringP2P.json | 1 - .../no_revision_available/MasakhaNEWSClusteringS2S.json | 1 - .../no_revision_available/MassiveIntentClassification.json | 1 - .../no_revision_available/MassiveScenarioClassification.json | 1 - .../no_revision_available/MintakaRetrieval.json | 1 - .../no_revision_available/OpusparcusPC.json | 1 - .../no_revision_available/PawsXPairClassification.json | 1 - results/voyage-multilingual-2/no_revision_available/SICKFr.json | 1 - results/voyage-multilingual-2/no_revision_available/STS22.json | 1 - .../voyage-multilingual-2/no_revision_available/SummEvalFr.json | 1 - .../no_revision_available/SyntecReranking.json | 1 - .../no_revision_available/SyntecRetrieval.json | 1 - .../no_revision_available/XPQARetrieval.json | 1 - 69 files changed, 69 deletions(-) diff --git a/results/text-embedding-3-large/no_revision_available/LEMBNarrativeQARetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBNarrativeQARetrieval.json index ad904412..8121f36b 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBNarrativeQARetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBNarrativeQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNarrativeQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 489.32, "map_at_1": 0.32836, diff --git a/results/text-embedding-3-large/no_revision_available/LEMBNeedleRetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBNeedleRetrieval.json index 9fe32a6e..69d67b69 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBNeedleRetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBNeedleRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNeedleRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 2.14, "map_at_1": 0.42, diff --git a/results/text-embedding-3-large/no_revision_available/LEMBPasskeyRetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBPasskeyRetrieval.json index b13a9ecf..5cf95a7d 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBPasskeyRetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBPasskeyRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBPasskeyRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 2.36, "map_at_1": 0.9, diff --git a/results/text-embedding-3-large/no_revision_available/LEMBQMSumRetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBQMSumRetrieval.json index 3a74b4b5..15d26344 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBQMSumRetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBQMSumRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBQMSumRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 78.37, "map_at_1": 0.18861, diff --git a/results/text-embedding-3-large/no_revision_available/LEMBSummScreenFDRetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBSummScreenFDRetrieval.json index 5ab625fd..22ba469a 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBSummScreenFDRetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBSummScreenFDRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBSummScreenFDRetrieval", - "mteb_version": "test", "validation": { "evaluation_time": 24.15, "map_at_1": 0.72024, diff --git a/results/text-embedding-3-large/no_revision_available/LEMBWikimQARetrieval.json b/results/text-embedding-3-large/no_revision_available/LEMBWikimQARetrieval.json index 11100fe2..a31670e6 100644 --- a/results/text-embedding-3-large/no_revision_available/LEMBWikimQARetrieval.json +++ b/results/text-embedding-3-large/no_revision_available/LEMBWikimQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBWikimQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 22.67, "map_at_1": 0.39667, diff --git a/results/voyage-law-2/no_revision_available/AlloProfClusteringP2P.json b/results/voyage-law-2/no_revision_available/AlloProfClusteringP2P.json index 89e5743b..41022364 100644 --- a/results/voyage-law-2/no_revision_available/AlloProfClusteringP2P.json +++ b/results/voyage-law-2/no_revision_available/AlloProfClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "392ba3f5bcc8c51f578786c1fc3dae648662cb9b", "mteb_dataset_name": "AlloProfClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 287.74, "main_score": 0.6249653710237563, diff --git a/results/voyage-law-2/no_revision_available/AlloProfClusteringS2S.json b/results/voyage-law-2/no_revision_available/AlloProfClusteringS2S.json index f890640c..2b2fc388 100644 --- a/results/voyage-law-2/no_revision_available/AlloProfClusteringS2S.json +++ b/results/voyage-law-2/no_revision_available/AlloProfClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "392ba3f5bcc8c51f578786c1fc3dae648662cb9b", "mteb_dataset_name": "AlloProfClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 7.98, "main_score": 0.44276840537872414, diff --git a/results/voyage-law-2/no_revision_available/AlloprofReranking.json b/results/voyage-law-2/no_revision_available/AlloprofReranking.json index 58329d73..61579016 100644 --- a/results/voyage-law-2/no_revision_available/AlloprofReranking.json +++ b/results/voyage-law-2/no_revision_available/AlloprofReranking.json @@ -1,7 +1,6 @@ { "dataset_revision": "e40c8a63ce02da43200eccb5b0846fcaa888f562", "mteb_dataset_name": "AlloprofReranking", - "mteb_version": "test", "test": { "evaluation_time": 2342.07, "map": 0.7291614763981776, diff --git a/results/voyage-law-2/no_revision_available/AlloprofRetrieval.json b/results/voyage-law-2/no_revision_available/AlloprofRetrieval.json index b8ebf296..431a606d 100644 --- a/results/voyage-law-2/no_revision_available/AlloprofRetrieval.json +++ b/results/voyage-law-2/no_revision_available/AlloprofRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "fcf295ea64c750f41fadbaa37b9b861558e1bfbd", "mteb_dataset_name": "AlloprofRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 282.79, "map_at_1": 0.3968, diff --git a/results/voyage-law-2/no_revision_available/AmazonReviewsClassification.json b/results/voyage-law-2/no_revision_available/AmazonReviewsClassification.json index 510250df..55f66d11 100644 --- a/results/voyage-law-2/no_revision_available/AmazonReviewsClassification.json +++ b/results/voyage-law-2/no_revision_available/AmazonReviewsClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "1399c76144fd37290681b995c656ef9b2e06e26d", "mteb_dataset_name": "AmazonReviewsClassification", - "mteb_version": "test", "test": { "evaluation_time": 38.55, "fr": { diff --git a/results/voyage-law-2/no_revision_available/BSARDRetrieval.json b/results/voyage-law-2/no_revision_available/BSARDRetrieval.json index cb98f6d1..c2f898a8 100644 --- a/results/voyage-law-2/no_revision_available/BSARDRetrieval.json +++ b/results/voyage-law-2/no_revision_available/BSARDRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "5effa1b9b5fa3b0f9e12523e6e43e5f86a6e6d59", "mteb_dataset_name": "BSARDRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 526.42, "map_at_1": 0.06306, diff --git a/results/voyage-law-2/no_revision_available/HALClusteringS2S.json b/results/voyage-law-2/no_revision_available/HALClusteringS2S.json index 8b760490..57f384d5 100644 --- a/results/voyage-law-2/no_revision_available/HALClusteringS2S.json +++ b/results/voyage-law-2/no_revision_available/HALClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "e06ebbbb123f8144bef1a5d18796f3dec9ae2915", "mteb_dataset_name": "HALClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 308.56, "main_score": 0.2635522952949986, diff --git a/results/voyage-law-2/no_revision_available/LEMBNarrativeQARetrieval.json b/results/voyage-law-2/no_revision_available/LEMBNarrativeQARetrieval.json index 3f3fc239..cb5b6878 100644 --- a/results/voyage-law-2/no_revision_available/LEMBNarrativeQARetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBNarrativeQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNarrativeQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 729.79, "map_at_1": 0.43574, diff --git a/results/voyage-law-2/no_revision_available/LEMBNeedleRetrieval.json b/results/voyage-law-2/no_revision_available/LEMBNeedleRetrieval.json index 3447add1..fe6d7d61 100644 --- a/results/voyage-law-2/no_revision_available/LEMBNeedleRetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBNeedleRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNeedleRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 7.98, "map_at_1": 0.92, diff --git a/results/voyage-law-2/no_revision_available/LEMBPasskeyRetrieval.json b/results/voyage-law-2/no_revision_available/LEMBPasskeyRetrieval.json index 547254a2..604035df 100644 --- a/results/voyage-law-2/no_revision_available/LEMBPasskeyRetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBPasskeyRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBPasskeyRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 7.81, "map_at_1": 0.98, diff --git a/results/voyage-law-2/no_revision_available/LEMBQMSumRetrieval.json b/results/voyage-law-2/no_revision_available/LEMBQMSumRetrieval.json index 57afb2e3..e156a4ac 100644 --- a/results/voyage-law-2/no_revision_available/LEMBQMSumRetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBQMSumRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBQMSumRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 298.09, "map_at_1": 0.41454, diff --git a/results/voyage-law-2/no_revision_available/LEMBSummScreenFDRetrieval.json b/results/voyage-law-2/no_revision_available/LEMBSummScreenFDRetrieval.json index 20cba324..23c9f901 100644 --- a/results/voyage-law-2/no_revision_available/LEMBSummScreenFDRetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBSummScreenFDRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBSummScreenFDRetrieval", - "mteb_version": "test", "validation": { "evaluation_time": 357.75, "map_at_1": 0.97321, diff --git a/results/voyage-law-2/no_revision_available/LEMBWikimQARetrieval.json b/results/voyage-law-2/no_revision_available/LEMBWikimQARetrieval.json index b214fdf4..c3e9fd18 100644 --- a/results/voyage-law-2/no_revision_available/LEMBWikimQARetrieval.json +++ b/results/voyage-law-2/no_revision_available/LEMBWikimQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBWikimQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 335.15, "map_at_1": 0.8, diff --git a/results/voyage-law-2/no_revision_available/MLSUMClusteringP2P.json b/results/voyage-law-2/no_revision_available/MLSUMClusteringP2P.json index 0b6735f6..6d9fbe56 100644 --- a/results/voyage-law-2/no_revision_available/MLSUMClusteringP2P.json +++ b/results/voyage-law-2/no_revision_available/MLSUMClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "b5d54f8f3b61ae17845046286940f03c6bc79bc7", "mteb_dataset_name": "MLSUMClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 1511.32, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MLSUMClusteringS2S.json b/results/voyage-law-2/no_revision_available/MLSUMClusteringS2S.json index 6844f2fe..0d0c0496 100644 --- a/results/voyage-law-2/no_revision_available/MLSUMClusteringS2S.json +++ b/results/voyage-law-2/no_revision_available/MLSUMClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "b5d54f8f3b61ae17845046286940f03c6bc79bc7", "mteb_dataset_name": "MLSUMClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 1485.47, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MTOPDomainClassification.json b/results/voyage-law-2/no_revision_available/MTOPDomainClassification.json index d335e345..672d1590 100644 --- a/results/voyage-law-2/no_revision_available/MTOPDomainClassification.json +++ b/results/voyage-law-2/no_revision_available/MTOPDomainClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "d80d48c1eb48d3562165c59d59d0034df9fff0bf", "mteb_dataset_name": "MTOPDomainClassification", - "mteb_version": "test", "test": { "evaluation_time": 10.45, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MTOPIntentClassification.json b/results/voyage-law-2/no_revision_available/MTOPIntentClassification.json index c0acf9d6..1f3eb29e 100644 --- a/results/voyage-law-2/no_revision_available/MTOPIntentClassification.json +++ b/results/voyage-law-2/no_revision_available/MTOPIntentClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba", "mteb_dataset_name": "MTOPIntentClassification", - "mteb_version": "test", "test": { "evaluation_time": 26.96, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MasakhaNEWSClassification.json b/results/voyage-law-2/no_revision_available/MasakhaNEWSClassification.json index 34f898ca..6ea07666 100644 --- a/results/voyage-law-2/no_revision_available/MasakhaNEWSClassification.json +++ b/results/voyage-law-2/no_revision_available/MasakhaNEWSClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClassification", - "mteb_version": "test", "test": { "evaluation_time": 153.12, "fra": { diff --git a/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringP2P.json b/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringP2P.json index 368a48c8..e2bad94f 100644 --- a/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringP2P.json +++ b/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 72.59, "fra": { diff --git a/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringS2S.json b/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringS2S.json index 08e4aa11..ec15d8bd 100644 --- a/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringS2S.json +++ b/results/voyage-law-2/no_revision_available/MasakhaNEWSClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 3.5, "fra": { diff --git a/results/voyage-law-2/no_revision_available/MassiveIntentClassification.json b/results/voyage-law-2/no_revision_available/MassiveIntentClassification.json index 6c340438..b3e2ccc9 100644 --- a/results/voyage-law-2/no_revision_available/MassiveIntentClassification.json +++ b/results/voyage-law-2/no_revision_available/MassiveIntentClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "31efe3c427b0bae9c22cbb560b8f15491cc6bed7", "mteb_dataset_name": "MassiveIntentClassification", - "mteb_version": "test", "test": { "evaluation_time": 18.76, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MassiveScenarioClassification.json b/results/voyage-law-2/no_revision_available/MassiveScenarioClassification.json index 8b5a31e5..a8c5edd3 100644 --- a/results/voyage-law-2/no_revision_available/MassiveScenarioClassification.json +++ b/results/voyage-law-2/no_revision_available/MassiveScenarioClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "7d571f92784cd94a019292a1f45445077d0ef634", "mteb_dataset_name": "MassiveScenarioClassification", - "mteb_version": "test", "test": { "evaluation_time": 11.98, "fr": { diff --git a/results/voyage-law-2/no_revision_available/MintakaRetrieval.json b/results/voyage-law-2/no_revision_available/MintakaRetrieval.json index a2f3237c..f839704a 100644 --- a/results/voyage-law-2/no_revision_available/MintakaRetrieval.json +++ b/results/voyage-law-2/no_revision_available/MintakaRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "efa78cc2f74bbcd21eff2261f9e13aebe40b814e", "mteb_dataset_name": "MintakaRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 15.21, "fr": { diff --git a/results/voyage-law-2/no_revision_available/OpusparcusPC.json b/results/voyage-law-2/no_revision_available/OpusparcusPC.json index 04baf164..0d3bb50f 100644 --- a/results/voyage-law-2/no_revision_available/OpusparcusPC.json +++ b/results/voyage-law-2/no_revision_available/OpusparcusPC.json @@ -1,7 +1,6 @@ { "dataset_revision": "9e9b1f8ef51616073f47f306f7f47dd91663f86a", "mteb_dataset_name": "OpusparcusPC", - "mteb_version": "test", "test.full": { "evaluation_time": 7.12, "fr": { diff --git a/results/voyage-law-2/no_revision_available/PawsXPairClassification.json b/results/voyage-law-2/no_revision_available/PawsXPairClassification.json index 2e01cb1e..a2c7f1c6 100644 --- a/results/voyage-law-2/no_revision_available/PawsXPairClassification.json +++ b/results/voyage-law-2/no_revision_available/PawsXPairClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "8a04d940a42cd40658986fdd8e3da561533a3646", "mteb_dataset_name": "PawsXPairClassification", - "mteb_version": "test", "test": { "evaluation_time": 17.61, "fr": { diff --git a/results/voyage-law-2/no_revision_available/SICKFr.json b/results/voyage-law-2/no_revision_available/SICKFr.json index 39b6436b..fdad8c46 100644 --- a/results/voyage-law-2/no_revision_available/SICKFr.json +++ b/results/voyage-law-2/no_revision_available/SICKFr.json @@ -1,7 +1,6 @@ { "dataset_revision": "e077ab4cf4774a1e36d86d593b150422fafd8e8a", "mteb_dataset_name": "SICKFr", - "mteb_version": "test", "test": { "cos_sim": { "pearson": 0.8167665128935123, diff --git a/results/voyage-law-2/no_revision_available/STS22.json b/results/voyage-law-2/no_revision_available/STS22.json index 4ec1a2cb..2420b90c 100644 --- a/results/voyage-law-2/no_revision_available/STS22.json +++ b/results/voyage-law-2/no_revision_available/STS22.json @@ -1,7 +1,6 @@ { "dataset_revision": "eea2b4fe26a775864c896887d910b76a8098ad3f", "mteb_dataset_name": "STS22", - "mteb_version": "test", "test": { "evaluation_time": 25.2, "fr": { diff --git a/results/voyage-law-2/no_revision_available/STSBenchmarkMultilingualSTS.json b/results/voyage-law-2/no_revision_available/STSBenchmarkMultilingualSTS.json index db38e0d9..51a79f65 100644 --- a/results/voyage-law-2/no_revision_available/STSBenchmarkMultilingualSTS.json +++ b/results/voyage-law-2/no_revision_available/STSBenchmarkMultilingualSTS.json @@ -1,7 +1,6 @@ { "dataset_revision": "93d57ef91790589e3ce9c365164337a8a78b7632", "mteb_dataset_name": "STSBenchmarkMultilingualSTS", - "mteb_version": "test", "test": { "evaluation_time": 7.49, "fr": { diff --git a/results/voyage-law-2/no_revision_available/SummEvalFr.json b/results/voyage-law-2/no_revision_available/SummEvalFr.json index 2f15220a..43aa2992 100644 --- a/results/voyage-law-2/no_revision_available/SummEvalFr.json +++ b/results/voyage-law-2/no_revision_available/SummEvalFr.json @@ -1,7 +1,6 @@ { "dataset_revision": "b385812de6a9577b6f4d0f88c6a6e35395a94054", "mteb_dataset_name": "SummEvalFr", - "mteb_version": "test", "test": { "cos_sim": { "pearson": 0.31700541200366006, diff --git a/results/voyage-law-2/no_revision_available/SyntecReranking.json b/results/voyage-law-2/no_revision_available/SyntecReranking.json index 2461eadd..b76ed61f 100644 --- a/results/voyage-law-2/no_revision_available/SyntecReranking.json +++ b/results/voyage-law-2/no_revision_available/SyntecReranking.json @@ -1,7 +1,6 @@ { "dataset_revision": "b205c5084a0934ce8af14338bf03feb19499c84d", "mteb_dataset_name": "SyntecReranking", - "mteb_version": "test", "test": { "evaluation_time": 18.59, "map": 0.9119999999999999, diff --git a/results/voyage-law-2/no_revision_available/SyntecRetrieval.json b/results/voyage-law-2/no_revision_available/SyntecRetrieval.json index e3339675..46068f34 100644 --- a/results/voyage-law-2/no_revision_available/SyntecRetrieval.json +++ b/results/voyage-law-2/no_revision_available/SyntecRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "19661ccdca4dfc2d15122d776b61685f48c68ca9", "mteb_dataset_name": "SyntecRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 7.82, "map_at_1": 0.72, diff --git a/results/voyage-law-2/no_revision_available/XPQARetrieval.json b/results/voyage-law-2/no_revision_available/XPQARetrieval.json index 4bf4d8a8..408e6b60 100644 --- a/results/voyage-law-2/no_revision_available/XPQARetrieval.json +++ b/results/voyage-law-2/no_revision_available/XPQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "c99d599f0a6ab9b85b065da6f9d94f9cf731679f", "mteb_dataset_name": "XPQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 9.67, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringP2P.json b/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringP2P.json index f6a349dd..0e27c47d 100644 --- a/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringP2P.json +++ b/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "392ba3f5bcc8c51f578786c1fc3dae648662cb9b", "mteb_dataset_name": "AlloProfClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 315.13, "main_score": 0.6536875126730821, diff --git a/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringS2S.json b/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringS2S.json index e59cdfcf..359543de 100644 --- a/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringS2S.json +++ b/results/voyage-multilingual-2/no_revision_available/AlloProfClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "392ba3f5bcc8c51f578786c1fc3dae648662cb9b", "mteb_dataset_name": "AlloProfClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 17.13, "main_score": 0.4703040848663136, diff --git a/results/voyage-multilingual-2/no_revision_available/AlloprofReranking.json b/results/voyage-multilingual-2/no_revision_available/AlloprofReranking.json index e98863f0..ff296563 100644 --- a/results/voyage-multilingual-2/no_revision_available/AlloprofReranking.json +++ b/results/voyage-multilingual-2/no_revision_available/AlloprofReranking.json @@ -1,7 +1,6 @@ { "dataset_revision": "e40c8a63ce02da43200eccb5b0846fcaa888f562", "mteb_dataset_name": "AlloprofReranking", - "mteb_version": "test", "test": { "evaluation_time": 2635.25, "map": 0.7478259710767642, diff --git a/results/voyage-multilingual-2/no_revision_available/AlloprofRetrieval.json b/results/voyage-multilingual-2/no_revision_available/AlloprofRetrieval.json index d9edfab0..7b646109 100644 --- a/results/voyage-multilingual-2/no_revision_available/AlloprofRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/AlloprofRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "fcf295ea64c750f41fadbaa37b9b861558e1bfbd", "mteb_dataset_name": "AlloprofRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 302.8, "map_at_1": 0.40112, diff --git a/results/voyage-multilingual-2/no_revision_available/AmazonReviewsClassification.json b/results/voyage-multilingual-2/no_revision_available/AmazonReviewsClassification.json index de953431..72f86db4 100644 --- a/results/voyage-multilingual-2/no_revision_available/AmazonReviewsClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/AmazonReviewsClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "1399c76144fd37290681b995c656ef9b2e06e26d", "mteb_dataset_name": "AmazonReviewsClassification", - "mteb_version": "test", "test": { "evaluation_time": 49.28, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/BSARDRetrieval.json b/results/voyage-multilingual-2/no_revision_available/BSARDRetrieval.json index b43bb9e9..3369c440 100644 --- a/results/voyage-multilingual-2/no_revision_available/BSARDRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/BSARDRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "5effa1b9b5fa3b0f9e12523e6e43e5f86a6e6d59", "mteb_dataset_name": "BSARDRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 607.54, "map_at_1": 0.01351, diff --git a/results/voyage-multilingual-2/no_revision_available/HALClusteringS2S.json b/results/voyage-multilingual-2/no_revision_available/HALClusteringS2S.json index 47eb1c9e..0ea1433c 100644 --- a/results/voyage-multilingual-2/no_revision_available/HALClusteringS2S.json +++ b/results/voyage-multilingual-2/no_revision_available/HALClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "e06ebbbb123f8144bef1a5d18796f3dec9ae2915", "mteb_dataset_name": "HALClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 605.26, "main_score": 0.27669961551374833, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBNarrativeQARetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBNarrativeQARetrieval.json index 513e5113..79eb6346 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBNarrativeQARetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBNarrativeQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNarrativeQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 1985.85, "map_at_1": 0.539, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBNeedleRetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBNeedleRetrieval.json index a006f9eb..d4897a8d 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBNeedleRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBNeedleRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBNeedleRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 8.95, "map_at_1": 0.86, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBPasskeyRetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBPasskeyRetrieval.json index 634a7416..0d3401be 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBPasskeyRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBPasskeyRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBPasskeyRetrieval", - "mteb_version": "test", "test_1024": { "evaluation_time": 8.93, "map_at_1": 1.0, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBQMSumRetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBQMSumRetrieval.json index 89cd39e3..0bd83601 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBQMSumRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBQMSumRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBQMSumRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 423.51, "map_at_1": 0.35363, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBSummScreenFDRetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBSummScreenFDRetrieval.json index 36f7ec08..a2ac4d7a 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBSummScreenFDRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBSummScreenFDRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBSummScreenFDRetrieval", - "mteb_version": "test", "validation": { "evaluation_time": 377.36, "map_at_1": 0.98512, diff --git a/results/voyage-multilingual-2/no_revision_available/LEMBWikimQARetrieval.json b/results/voyage-multilingual-2/no_revision_available/LEMBWikimQARetrieval.json index dcce410e..9b0cdf50 100644 --- a/results/voyage-multilingual-2/no_revision_available/LEMBWikimQARetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/LEMBWikimQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "6e346642246bfb4928c560ee08640dc84d074e8c", "mteb_dataset_name": "LEMBWikimQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 370.88, "map_at_1": 0.79667, diff --git a/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringP2P.json b/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringP2P.json index 6fd7e66e..8098c205 100644 --- a/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringP2P.json +++ b/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "b5d54f8f3b61ae17845046286940f03c6bc79bc7", "mteb_dataset_name": "MLSUMClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 1770.91, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringS2S.json b/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringS2S.json index f9d5c6bb..958067e6 100644 --- a/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringS2S.json +++ b/results/voyage-multilingual-2/no_revision_available/MLSUMClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "b5d54f8f3b61ae17845046286940f03c6bc79bc7", "mteb_dataset_name": "MLSUMClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 1736.82, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MTOPDomainClassification.json b/results/voyage-multilingual-2/no_revision_available/MTOPDomainClassification.json index 701b7831..00813410 100644 --- a/results/voyage-multilingual-2/no_revision_available/MTOPDomainClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/MTOPDomainClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "d80d48c1eb48d3562165c59d59d0034df9fff0bf", "mteb_dataset_name": "MTOPDomainClassification", - "mteb_version": "test", "test": { "evaluation_time": 24.14, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MTOPIntentClassification.json b/results/voyage-multilingual-2/no_revision_available/MTOPIntentClassification.json index b904ba5c..45d2e813 100644 --- a/results/voyage-multilingual-2/no_revision_available/MTOPIntentClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/MTOPIntentClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba", "mteb_dataset_name": "MTOPIntentClassification", - "mteb_version": "test", "test": { "evaluation_time": 71.69, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClassification.json b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClassification.json index ef305c2d..65e63259 100644 --- a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClassification", - "mteb_version": "test", "test": { "evaluation_time": 141.83, "fra": { diff --git a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringP2P.json b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringP2P.json index 7c907bac..085f160d 100644 --- a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringP2P.json +++ b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringP2P.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClusteringP2P", - "mteb_version": "test", "test": { "evaluation_time": 76.21, "fra": { diff --git a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringS2S.json b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringS2S.json index 219c3670..2f7b6bf2 100644 --- a/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringS2S.json +++ b/results/voyage-multilingual-2/no_revision_available/MasakhaNEWSClusteringS2S.json @@ -1,7 +1,6 @@ { "dataset_revision": "8ccc72e69e65f40c70e117d8b3c08306bb788b60", "mteb_dataset_name": "MasakhaNEWSClusteringS2S", - "mteb_version": "test", "test": { "evaluation_time": 4.87, "fra": { diff --git a/results/voyage-multilingual-2/no_revision_available/MassiveIntentClassification.json b/results/voyage-multilingual-2/no_revision_available/MassiveIntentClassification.json index d546386b..dd85a8fd 100644 --- a/results/voyage-multilingual-2/no_revision_available/MassiveIntentClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/MassiveIntentClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "31efe3c427b0bae9c22cbb560b8f15491cc6bed7", "mteb_dataset_name": "MassiveIntentClassification", - "mteb_version": "test", "test": { "evaluation_time": 53.32, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MassiveScenarioClassification.json b/results/voyage-multilingual-2/no_revision_available/MassiveScenarioClassification.json index 04821622..dc3ba9e4 100644 --- a/results/voyage-multilingual-2/no_revision_available/MassiveScenarioClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/MassiveScenarioClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "7d571f92784cd94a019292a1f45445077d0ef634", "mteb_dataset_name": "MassiveScenarioClassification", - "mteb_version": "test", "test": { "evaluation_time": 34.55, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/MintakaRetrieval.json b/results/voyage-multilingual-2/no_revision_available/MintakaRetrieval.json index 39ce8a5c..6ec4749a 100644 --- a/results/voyage-multilingual-2/no_revision_available/MintakaRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/MintakaRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "efa78cc2f74bbcd21eff2261f9e13aebe40b814e", "mteb_dataset_name": "MintakaRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 20.29, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/OpusparcusPC.json b/results/voyage-multilingual-2/no_revision_available/OpusparcusPC.json index fdc52530..6514b722 100644 --- a/results/voyage-multilingual-2/no_revision_available/OpusparcusPC.json +++ b/results/voyage-multilingual-2/no_revision_available/OpusparcusPC.json @@ -1,7 +1,6 @@ { "dataset_revision": "9e9b1f8ef51616073f47f306f7f47dd91663f86a", "mteb_dataset_name": "OpusparcusPC", - "mteb_version": "test", "test.full": { "evaluation_time": 17.77, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/PawsXPairClassification.json b/results/voyage-multilingual-2/no_revision_available/PawsXPairClassification.json index d3aea87b..f7aa9ccf 100644 --- a/results/voyage-multilingual-2/no_revision_available/PawsXPairClassification.json +++ b/results/voyage-multilingual-2/no_revision_available/PawsXPairClassification.json @@ -1,7 +1,6 @@ { "dataset_revision": "8a04d940a42cd40658986fdd8e3da561533a3646", "mteb_dataset_name": "PawsXPairClassification", - "mteb_version": "test", "test": { "evaluation_time": 26.42, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/SICKFr.json b/results/voyage-multilingual-2/no_revision_available/SICKFr.json index dfa0b84a..8582d0d4 100644 --- a/results/voyage-multilingual-2/no_revision_available/SICKFr.json +++ b/results/voyage-multilingual-2/no_revision_available/SICKFr.json @@ -1,7 +1,6 @@ { "dataset_revision": "e077ab4cf4774a1e36d86d593b150422fafd8e8a", "mteb_dataset_name": "SICKFr", - "mteb_version": "test", "test": { "cos_sim": { "pearson": 0.8160408707764789, diff --git a/results/voyage-multilingual-2/no_revision_available/STS22.json b/results/voyage-multilingual-2/no_revision_available/STS22.json index 6cd03d39..e6e547d5 100644 --- a/results/voyage-multilingual-2/no_revision_available/STS22.json +++ b/results/voyage-multilingual-2/no_revision_available/STS22.json @@ -1,7 +1,6 @@ { "dataset_revision": "eea2b4fe26a775864c896887d910b76a8098ad3f", "mteb_dataset_name": "STS22", - "mteb_version": "test", "test": { "evaluation_time": 19.36, "fr": { diff --git a/results/voyage-multilingual-2/no_revision_available/SummEvalFr.json b/results/voyage-multilingual-2/no_revision_available/SummEvalFr.json index abb09713..074cdc15 100644 --- a/results/voyage-multilingual-2/no_revision_available/SummEvalFr.json +++ b/results/voyage-multilingual-2/no_revision_available/SummEvalFr.json @@ -1,7 +1,6 @@ { "dataset_revision": "b385812de6a9577b6f4d0f88c6a6e35395a94054", "mteb_dataset_name": "SummEvalFr", - "mteb_version": "test", "test": { "cos_sim": { "pearson": 0.3096747641961261, diff --git a/results/voyage-multilingual-2/no_revision_available/SyntecReranking.json b/results/voyage-multilingual-2/no_revision_available/SyntecReranking.json index 77b380f8..073173f7 100644 --- a/results/voyage-multilingual-2/no_revision_available/SyntecReranking.json +++ b/results/voyage-multilingual-2/no_revision_available/SyntecReranking.json @@ -1,7 +1,6 @@ { "dataset_revision": "b205c5084a0934ce8af14338bf03feb19499c84d", "mteb_dataset_name": "SyntecReranking", - "mteb_version": "test", "test": { "evaluation_time": 19.09, "map": 0.904, diff --git a/results/voyage-multilingual-2/no_revision_available/SyntecRetrieval.json b/results/voyage-multilingual-2/no_revision_available/SyntecRetrieval.json index 52118b63..062b0c80 100644 --- a/results/voyage-multilingual-2/no_revision_available/SyntecRetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/SyntecRetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "19661ccdca4dfc2d15122d776b61685f48c68ca9", "mteb_dataset_name": "SyntecRetrieval", - "mteb_version": "test", "test": { "evaluation_time": 6.01, "map_at_1": 0.75, diff --git a/results/voyage-multilingual-2/no_revision_available/XPQARetrieval.json b/results/voyage-multilingual-2/no_revision_available/XPQARetrieval.json index c2f278bb..64f3fb98 100644 --- a/results/voyage-multilingual-2/no_revision_available/XPQARetrieval.json +++ b/results/voyage-multilingual-2/no_revision_available/XPQARetrieval.json @@ -1,7 +1,6 @@ { "dataset_revision": "c99d599f0a6ab9b85b065da6f9d94f9cf731679f", "mteb_dataset_name": "XPQARetrieval", - "mteb_version": "test", "test": { "evaluation_time": 12.33, "fr": { From 1dff53730d64c6e715ea7251da53749476f6ec8b Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:51:58 +0200 Subject: [PATCH 02/15] remove task that does not exist within MTEB I also attempted to figure out if it was renamed. I could not find that to be the case. --- .../no_revision_available/Sohuddb.json | 20 ------------------- .../no_revision_available/Sohuddb.json | 20 ------------------- .../no_revision_available/Sohuddb.json | 20 ------------------- .../no_revision_available/Sohuddb.json | 20 ------------------- .../no_revision_available/Sohuddb.json | 20 ------------------- 5 files changed, 100 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/Sohuddb.json delete mode 100644 results/m3e-base/no_revision_available/Sohuddb.json delete mode 100644 results/m3e-large/no_revision_available/Sohuddb.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/Sohuddb.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/Sohuddb.json diff --git a/results/luotuo-bert-medium/no_revision_available/Sohuddb.json b/results/luotuo-bert-medium/no_revision_available/Sohuddb.json deleted file mode 100644 index 0f8fc80a..00000000 --- a/results/luotuo-bert-medium/no_revision_available/Sohuddb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuddb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5648113674900062, - "spearman": 0.49510564928129136 - }, - "euclidean": { - "pearson": 0.6248314862553384, - "spearman": 0.49510564928129136 - }, - "evaluation_time": 16.92, - "manhattan": { - "pearson": 0.6236587032362781, - "spearman": 0.4935004849256975 - } - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/Sohuddb.json b/results/m3e-base/no_revision_available/Sohuddb.json deleted file mode 100644 index 1dc78e89..00000000 --- a/results/m3e-base/no_revision_available/Sohuddb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuddb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5789130591226548, - "spearman": 0.5143968063548823 - }, - "euclidean": { - "pearson": 0.6293093065760333, - "spearman": 0.5159901619461696 - }, - "evaluation_time": 2.44, - "manhattan": { - "pearson": 0.6310418873400123, - "spearman": 0.5175758633705007 - } - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/Sohuddb.json b/results/m3e-large/no_revision_available/Sohuddb.json deleted file mode 100644 index 47f48ad6..00000000 --- a/results/m3e-large/no_revision_available/Sohuddb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuddb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5391132000950176, - "spearman": 0.4940841810550044 - }, - "euclidean": { - "pearson": 0.6115163371227998, - "spearman": 0.503858878248473 - }, - "evaluation_time": 7.4, - "manhattan": { - "pearson": 0.6114817074218368, - "spearman": 0.5033335540393461 - } - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/Sohuddb.json b/results/text2vec-base-chinese/no_revision_available/Sohuddb.json deleted file mode 100644 index e899c87d..00000000 --- a/results/text2vec-base-chinese/no_revision_available/Sohuddb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuddb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5412696060476951, - "spearman": 0.4879553716972826 - }, - "euclidean": { - "pearson": 0.5757404305726859, - "spearman": 0.4667264072663419 - }, - "evaluation_time": 2.31, - "manhattan": { - "pearson": 0.5757925475288034, - "spearman": 0.46606488765373755 - } - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/Sohuddb.json b/results/text2vec-large-chinese/no_revision_available/Sohuddb.json deleted file mode 100644 index b1a647a3..00000000 --- a/results/text2vec-large-chinese/no_revision_available/Sohuddb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuddb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6028313709149844, - "spearman": 0.5043572329308047 - }, - "euclidean": { - "pearson": 0.6309144445102868, - "spearman": 0.496932381268873 - }, - "evaluation_time": 7.49, - "manhattan": { - "pearson": 0.6312791087683431, - "spearman": 0.4984207998613994 - } - } -} \ No newline at end of file From d8d13c797962118fe74b76e7bb5385d29d56b29b Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:53:35 +0200 Subject: [PATCH 03/15] removed ChnSentiCorp --- .../no_revision_available/ChnSentiCorp.json | 15 --------------- .../no_revision_available/ChnSentiCorp.json | 15 --------------- .../no_revision_available/ChnSentiCorp.json | 15 --------------- .../no_revision_available/ChnSentiCorp.json | 15 --------------- .../no_revision_available/ChnSentiCorp.json | 15 --------------- .../no_revision_available/ChnSentiCorp.json | 15 --------------- 6 files changed, 90 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/ChnSentiCorp.json delete mode 100644 results/m3e-base/no_revision_available/ChnSentiCorp.json delete mode 100644 results/m3e-large/no_revision_available/ChnSentiCorp.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/ChnSentiCorp.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/ChnSentiCorp.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/ChnSentiCorp.json diff --git a/results/luotuo-bert-medium/no_revision_available/ChnSentiCorp.json b/results/luotuo-bert-medium/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index 7f714856..00000000 --- a/results/luotuo-bert-medium/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.6553333333333333, - "accuracy_stderr": 0.04609501057598315, - "ap": 0.6010180678440944, - "ap_stderr": 0.0371080652735924, - "evaluation_time": 38.85, - "f1": 0.6513169545375643, - "f1_stderr": 0.04951477462576623, - "main_score": 0.6553333333333333 - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/ChnSentiCorp.json b/results/m3e-base/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index a70795bf..00000000 --- a/results/m3e-base/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.8024166666666666, - "accuracy_stderr": 0.04477482241418967, - "ap": 0.7414707892290573, - "ap_stderr": 0.046370568575171627, - "evaluation_time": 9.05, - "f1": 0.8013898324482012, - "f1_stderr": 0.04563889173921327, - "main_score": 0.8024166666666666 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/ChnSentiCorp.json b/results/m3e-large/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index 9af7ec4b..00000000 --- a/results/m3e-large/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.8400000000000001, - "accuracy_stderr": 0.05413845419128832, - "ap": 0.785802857686188, - "ap_stderr": 0.06038453457326963, - "evaluation_time": 18.44, - "f1": 0.8392920841265727, - "f1_stderr": 0.055090454616793315, - "main_score": 0.8400000000000001 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/ChnSentiCorp.json b/results/text-embedding-ada-002/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index 2726367e..00000000 --- a/results/text-embedding-ada-002/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.7038333333333333, - "accuracy_stderr": 0.06392182725798756, - "ap": 0.645102672253325, - "ap_stderr": 0.05738272469381464, - "evaluation_time": 445.37, - "f1": 0.7007715917485109, - "f1_stderr": 0.06690258473516557, - "main_score": 0.7038333333333333 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/ChnSentiCorp.json b/results/text2vec-base-chinese/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index fbf38257..00000000 --- a/results/text2vec-base-chinese/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.72425, - "accuracy_stderr": 0.03573912033363753, - "ap": 0.6600581393389306, - "ap_stderr": 0.03189757658825878, - "evaluation_time": 6.72, - "f1": 0.7222664478797581, - "f1_stderr": 0.03741379195535388, - "main_score": 0.72425 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/ChnSentiCorp.json b/results/text2vec-large-chinese/no_revision_available/ChnSentiCorp.json deleted file mode 100644 index 143af958..00000000 --- a/results/text2vec-large-chinese/no_revision_available/ChnSentiCorp.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "ChnSentiCorp", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.7260833333333333, - "accuracy_stderr": 0.02239497091362751, - "ap": 0.6655747577674844, - "ap_stderr": 0.023229724677964296, - "evaluation_time": 17.92, - "f1": 0.724237828512715, - "f1_stderr": 0.02302399158803661, - "main_score": 0.7260833333333333 - } -} \ No newline at end of file From dc0ae59c18a50396dcff8a279ac8f5824c70292b Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:54:23 +0200 Subject: [PATCH 04/15] Removed FoodSafety --- .../no_revision_available/FoodSafety.json | 15 --------------- .../no_revision_available/FoodSafety.json | 15 --------------- .../no_revision_available/FoodSafety.json | 15 --------------- .../no_revision_available/FoodSafety.json | 15 --------------- .../no_revision_available/FoodSafety.json | 15 --------------- .../no_revision_available/FoodSafety.json | 15 --------------- 6 files changed, 90 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/FoodSafety.json delete mode 100644 results/m3e-base/no_revision_available/FoodSafety.json delete mode 100644 results/m3e-large/no_revision_available/FoodSafety.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/FoodSafety.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/FoodSafety.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/FoodSafety.json diff --git a/results/luotuo-bert-medium/no_revision_available/FoodSafety.json b/results/luotuo-bert-medium/no_revision_available/FoodSafety.json deleted file mode 100644 index 1bd6d6c0..00000000 --- a/results/luotuo-bert-medium/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.963953488372093, - "accuracy_stderr": 0.03950801691208633, - "ap": 0.8977892995065202, - "ap_stderr": 0.08697431689159942, - "evaluation_time": 43.65, - "f1": 0.9583348668490537, - "f1_stderr": 0.042428697040349427, - "main_score": 0.963953488372093 - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/FoodSafety.json b/results/m3e-base/no_revision_available/FoodSafety.json deleted file mode 100644 index 6005cdac..00000000 --- a/results/m3e-base/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.9593635250917993, - "accuracy_stderr": 0.043948066827963435, - "ap": 0.8879721587303052, - "ap_stderr": 0.10089229687123932, - "evaluation_time": 4.66, - "f1": 0.9534156411525407, - "f1_stderr": 0.04779409334770204, - "main_score": 0.9593635250917993 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/FoodSafety.json b/results/m3e-large/no_revision_available/FoodSafety.json deleted file mode 100644 index d8bea265..00000000 --- a/results/m3e-large/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.9629130966952266, - "accuracy_stderr": 0.033783238411552466, - "ap": 0.8923655986670944, - "ap_stderr": 0.08122975478075166, - "evaluation_time": 16.01, - "f1": 0.9568587305240636, - "f1_stderr": 0.03720898046060011, - "main_score": 0.9629130966952266 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/FoodSafety.json b/results/text-embedding-ada-002/no_revision_available/FoodSafety.json deleted file mode 100644 index 3a96af4e..00000000 --- a/results/text-embedding-ada-002/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.9469400244798042, - "accuracy_stderr": 0.0642705883047549, - "ap": 0.8668652439501472, - "ap_stderr": 0.12998303944580755, - "evaluation_time": 118.79, - "f1": 0.9408111093887586, - "f1_stderr": 0.06756889673428046, - "main_score": 0.9469400244798042 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/FoodSafety.json b/results/text2vec-base-chinese/no_revision_available/FoodSafety.json deleted file mode 100644 index 16e3cba2..00000000 --- a/results/text2vec-base-chinese/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.9245410036719706, - "accuracy_stderr": 0.07136925689945725, - "ap": 0.8141604893718837, - "ap_stderr": 0.1281298649778236, - "evaluation_time": 3.45, - "f1": 0.9164028379552166, - "f1_stderr": 0.07309990040200734, - "main_score": 0.9245410036719706 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/FoodSafety.json b/results/text2vec-large-chinese/no_revision_available/FoodSafety.json deleted file mode 100644 index c860a935..00000000 --- a/results/text2vec-large-chinese/no_revision_available/FoodSafety.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "FoodSafety", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.9055691554467564, - "accuracy_stderr": 0.07973525890626366, - "ap": 0.7770689010532261, - "ap_stderr": 0.13381581787652058, - "evaluation_time": 16.13, - "f1": 0.8964792948741991, - "f1_stderr": 0.08048066592339458, - "main_score": 0.9055691554467564 - } -} \ No newline at end of file From f0298b0c6777a52dd40e6771732f6a5be94fbabc Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:55:13 +0200 Subject: [PATCH 05/15] remove Sohucca --- .../no_revision_available/Sohucca.json | 20 ------------------- .../no_revision_available/Sohucca.json | 20 ------------------- .../no_revision_available/Sohucca.json | 20 ------------------- .../no_revision_available/Sohucca.json | 20 ------------------- .../no_revision_available/Sohucca.json | 20 ------------------- 5 files changed, 100 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/Sohucca.json delete mode 100644 results/m3e-base/no_revision_available/Sohucca.json delete mode 100644 results/m3e-large/no_revision_available/Sohucca.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/Sohucca.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/Sohucca.json diff --git a/results/luotuo-bert-medium/no_revision_available/Sohucca.json b/results/luotuo-bert-medium/no_revision_available/Sohucca.json deleted file mode 100644 index 32f4c407..00000000 --- a/results/luotuo-bert-medium/no_revision_available/Sohucca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohucca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6276674619147404, - "spearman": 0.6630774039557118 - }, - "euclidean": { - "pearson": 0.6364241942783397, - "spearman": 0.6630774039557118 - }, - "evaluation_time": 63.28, - "manhattan": { - "pearson": 0.6365050221493356, - "spearman": 0.6626387271471469 - } - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/Sohucca.json b/results/m3e-base/no_revision_available/Sohucca.json deleted file mode 100644 index 406f2a91..00000000 --- a/results/m3e-base/no_revision_available/Sohucca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohucca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6277804930281583, - "spearman": 0.6455233704257503 - }, - "euclidean": { - "pearson": 0.6011460566528497, - "spearman": 0.6450707654327145 - }, - "evaluation_time": 19.11, - "manhattan": { - "pearson": 0.6014135672961469, - "spearman": 0.6456208522244069 - } - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/Sohucca.json b/results/m3e-large/no_revision_available/Sohucca.json deleted file mode 100644 index 5d5055a8..00000000 --- a/results/m3e-large/no_revision_available/Sohucca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohucca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6258443851385096, - "spearman": 0.6374600709603107 - }, - "euclidean": { - "pearson": 0.6125951307157442, - "spearman": 0.6418259496741232 - }, - "evaluation_time": 59.55, - "manhattan": { - "pearson": 0.6120588937317608, - "spearman": 0.640266209910337 - } - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/Sohucca.json b/results/text2vec-base-chinese/no_revision_available/Sohucca.json deleted file mode 100644 index a26d452b..00000000 --- a/results/text2vec-base-chinese/no_revision_available/Sohucca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohucca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5668449810303844, - "spearman": 0.5814436418968008 - }, - "euclidean": { - "pearson": 0.5341271493467923, - "spearman": 0.5750723626333543 - }, - "evaluation_time": 5.45, - "manhattan": { - "pearson": 0.5340910361262661, - "spearman": 0.5738816645414969 - } - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/Sohucca.json b/results/text2vec-large-chinese/no_revision_available/Sohucca.json deleted file mode 100644 index e11b9a0a..00000000 --- a/results/text2vec-large-chinese/no_revision_available/Sohucca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohucca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6042074587488337, - "spearman": 0.6177962089382903 - }, - "euclidean": { - "pearson": 0.5701656572924783, - "spearman": 0.6136044083231146 - }, - "evaluation_time": 60.63, - "manhattan": { - "pearson": 0.5704560334093998, - "spearman": 0.6141196794950797 - } - } -} \ No newline at end of file From 03a0f23ebb03c4203160f273be770f1971452a36 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:55:53 +0200 Subject: [PATCH 06/15] remove T2RankingRetrieval --- .../T2RankingRetrieval.json | 38 ------------------- .../T2RankingRetrieval.json | 38 ------------------- 2 files changed, 76 deletions(-) delete mode 100644 results/m3e-base/no_revision_available/T2RankingRetrieval.json delete mode 100644 results/m3e-large/no_revision_available/T2RankingRetrieval.json diff --git a/results/m3e-base/no_revision_available/T2RankingRetrieval.json b/results/m3e-base/no_revision_available/T2RankingRetrieval.json deleted file mode 100644 index 2d75ce10..00000000 --- a/results/m3e-base/no_revision_available/T2RankingRetrieval.json +++ /dev/null @@ -1,38 +0,0 @@ -{ - "dataset_revision": null, - "dev": { - "evaluation_time": 69.77, - "map_at_1": 0.62604, - "map_at_10": 0.76562, - "map_at_100": 0.76935, - "map_at_1000": 0.76946, - "map_at_3": 0.74276, - "map_at_5": 0.75673, - "mrr_at_1": 0.70472, - "mrr_at_10": 0.78407, - "mrr_at_100": 0.78648, - "mrr_at_1000": 0.78656, - "mrr_at_3": 0.77296, - "mrr_at_5": 0.77937, - "ndcg_at_1": 0.68812, - "ndcg_at_10": 0.80044, - "ndcg_at_100": 0.81481, - "ndcg_at_1000": 0.81749, - "ndcg_at_3": 0.76875, - "ndcg_at_5": 0.7854, - "precision_at_1": 0.70472, - "precision_at_10": 0.11404, - "precision_at_100": 0.01228, - "precision_at_1000": 0.00125, - "precision_at_3": 0.33378, - "precision_at_5": 0.21409, - "recall_at_1": 0.62604, - "recall_at_10": 0.90152, - "recall_at_100": 0.96435, - "recall_at_1000": 0.9852, - "recall_at_3": 0.81921, - "recall_at_5": 0.8585 - }, - "mteb_dataset_name": "T2RankingRetrieval", - "mteb_version": "1.0.2" -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/T2RankingRetrieval.json b/results/m3e-large/no_revision_available/T2RankingRetrieval.json deleted file mode 100644 index aa3549f3..00000000 --- a/results/m3e-large/no_revision_available/T2RankingRetrieval.json +++ /dev/null @@ -1,38 +0,0 @@ -{ - "dataset_revision": null, - "dev": { - "evaluation_time": 219.6, - "map_at_1": 0.62561, - "map_at_10": 0.76272, - "map_at_100": 0.76664, - "map_at_1000": 0.76678, - "map_at_3": 0.73781, - "map_at_5": 0.75387, - "mrr_at_1": 0.70634, - "mrr_at_10": 0.78275, - "mrr_at_100": 0.78527, - "mrr_at_1000": 0.78536, - "mrr_at_3": 0.77013, - "mrr_at_5": 0.77828, - "ndcg_at_1": 0.68839, - "ndcg_at_10": 0.79741, - "ndcg_at_100": 0.8122, - "ndcg_at_1000": 0.81535, - "ndcg_at_3": 0.76235, - "ndcg_at_5": 0.78262, - "precision_at_1": 0.70634, - "precision_at_10": 0.11352, - "precision_at_100": 0.01225, - "precision_at_1000": 0.00126, - "precision_at_3": 0.3291, - "precision_at_5": 0.21306, - "recall_at_1": 0.62561, - "recall_at_10": 0.89815, - "recall_at_100": 0.96268, - "recall_at_1000": 0.98722, - "recall_at_3": 0.80887, - "recall_at_5": 0.85525 - }, - "mteb_dataset_name": "T2RankingRetrieval", - "mteb_version": "1.0.2" -} \ No newline at end of file From 8eb207aecf63352b315cde5fbb04278a0ff0da23 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:56:36 +0200 Subject: [PATCH 07/15] remove StockComSentiment --- .../no_revision_available/StockComSentiment.json | 13 ------------- .../no_revision_available/StockComSentiment.json | 13 ------------- .../no_revision_available/StockComSentiment.json | 13 ------------- .../no_revision_available/StockComSentiment.json | 13 ------------- .../no_revision_available/StockComSentiment.json | 13 ------------- .../no_revision_available/StockComSentiment.json | 13 ------------- 6 files changed, 78 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/StockComSentiment.json delete mode 100644 results/m3e-base/no_revision_available/StockComSentiment.json delete mode 100644 results/m3e-large/no_revision_available/StockComSentiment.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/StockComSentiment.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/StockComSentiment.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/StockComSentiment.json diff --git a/results/luotuo-bert-medium/no_revision_available/StockComSentiment.json b/results/luotuo-bert-medium/no_revision_available/StockComSentiment.json deleted file mode 100644 index 05b60a76..00000000 --- a/results/luotuo-bert-medium/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.49160317986088103, - "accuracy_stderr": 0.029947798064656757, - "evaluation_time": 19.59, - "f1": 0.4236092333486535, - "f1_stderr": 0.016061521814735948, - "main_score": 0.49160317986088103 - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/StockComSentiment.json b/results/m3e-base/no_revision_available/StockComSentiment.json deleted file mode 100644 index fbbd224f..00000000 --- a/results/m3e-base/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.43631997350115936, - "accuracy_stderr": 0.02108272378736771, - "evaluation_time": 9.69, - "f1": 0.39191727583674246, - "f1_stderr": 0.013592955896830744, - "main_score": 0.43631997350115936 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/StockComSentiment.json b/results/m3e-large/no_revision_available/StockComSentiment.json deleted file mode 100644 index 25e82b8e..00000000 --- a/results/m3e-large/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.4475819807883405, - "accuracy_stderr": 0.026257518450391776, - "evaluation_time": 12.15, - "f1": 0.3985774065189805, - "f1_stderr": 0.01669074480953102, - "main_score": 0.4475819807883405 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/StockComSentiment.json b/results/text-embedding-ada-002/no_revision_available/StockComSentiment.json deleted file mode 100644 index 00482fa5..00000000 --- a/results/text-embedding-ada-002/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.48108645246770454, - "accuracy_stderr": 0.028593683434879582, - "evaluation_time": 2153.46, - "f1": 0.4188284121111917, - "f1_stderr": 0.014389446535035723, - "main_score": 0.48108645246770454 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/StockComSentiment.json b/results/text2vec-base-chinese/no_revision_available/StockComSentiment.json deleted file mode 100644 index 42a571e1..00000000 --- a/results/text2vec-base-chinese/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.4306889698575687, - "accuracy_stderr": 0.0157211731762314, - "evaluation_time": 9.55, - "f1": 0.3865034560068128, - "f1_stderr": 0.010965251720154862, - "main_score": 0.4306889698575687 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/StockComSentiment.json b/results/text2vec-large-chinese/no_revision_available/StockComSentiment.json deleted file mode 100644 index 7cc2b890..00000000 --- a/results/text2vec-large-chinese/no_revision_available/StockComSentiment.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "StockComSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.43867174561112954, - "accuracy_stderr": 0.012732558950426166, - "evaluation_time": 15.24, - "f1": 0.3921143673134987, - "f1_stderr": 0.009428725332622498, - "main_score": 0.43867174561112954 - } -} \ No newline at end of file From 0243d96149811bde48470977e090b3709f94ec7b Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:57:22 +0200 Subject: [PATCH 08/15] Remove MedQuationClustering --- .../no_revision_available/MedQuationClustering.json | 10 ---------- .../no_revision_available/MedQuationClustering.json | 10 ---------- .../no_revision_available/MedQuationClustering.json | 10 ---------- .../no_revision_available/MedQuationClustering.json | 10 ---------- .../no_revision_available/MedQuationClustering.json | 10 ---------- .../no_revision_available/MedQuationClustering.json | 10 ---------- 6 files changed, 60 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/MedQuationClustering.json delete mode 100644 results/m3e-base/no_revision_available/MedQuationClustering.json delete mode 100644 results/m3e-large/no_revision_available/MedQuationClustering.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/MedQuationClustering.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/MedQuationClustering.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/MedQuationClustering.json diff --git a/results/luotuo-bert-medium/no_revision_available/MedQuationClustering.json b/results/luotuo-bert-medium/no_revision_available/MedQuationClustering.json deleted file mode 100644 index d04200f2..00000000 --- a/results/luotuo-bert-medium/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 1587.77, - "v_measure": 0.24736018758973996, - "v_measure_std": 0.009591996945365984 - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/MedQuationClustering.json b/results/m3e-base/no_revision_available/MedQuationClustering.json deleted file mode 100644 index 6fb0582d..00000000 --- a/results/m3e-base/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "validation": { - "evaluation_time": 81.91, - "v_measure": 0.29911480708851773, - "v_measure_std": 0.009879229296911667 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/MedQuationClustering.json b/results/m3e-large/no_revision_available/MedQuationClustering.json deleted file mode 100644 index 16966ad3..00000000 --- a/results/m3e-large/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "validation": { - "evaluation_time": 231.35, - "v_measure": 0.31130407438868735, - "v_measure_std": 0.011665302902534785 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/MedQuationClustering.json b/results/text-embedding-ada-002/no_revision_available/MedQuationClustering.json deleted file mode 100644 index 5a28ae6a..00000000 --- a/results/text-embedding-ada-002/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 2087.67, - "v_measure": 0.27539698666332857, - "v_measure_std": 0.012003855223840794 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/MedQuationClustering.json b/results/text2vec-base-chinese/no_revision_available/MedQuationClustering.json deleted file mode 100644 index ca6b32b0..00000000 --- a/results/text2vec-base-chinese/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 74.96, - "v_measure": 0.2717411874462805, - "v_measure_std": 0.005760165400706075 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/MedQuationClustering.json b/results/text2vec-large-chinese/no_revision_available/MedQuationClustering.json deleted file mode 100644 index 6ad0996b..00000000 --- a/results/text2vec-large-chinese/no_revision_available/MedQuationClustering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "MedQuationClustering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 237.16, - "v_measure": 0.2882118938755341, - "v_measure_std": 0.004816952331803009 - } -} \ No newline at end of file From 7e434f47927917dc445c48fb2b879ff6c1d123be Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:58:11 +0200 Subject: [PATCH 09/15] remove Sohudca --- .../no_revision_available/Sohudca.json | 20 ------------------- .../no_revision_available/Sohudca.json | 20 ------------------- .../no_revision_available/Sohudca.json | 20 ------------------- .../no_revision_available/Sohudca.json | 20 ------------------- .../no_revision_available/Sohudca.json | 20 ------------------- 5 files changed, 100 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/Sohudca.json delete mode 100644 results/m3e-base/no_revision_available/Sohudca.json delete mode 100644 results/m3e-large/no_revision_available/Sohudca.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/Sohudca.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/Sohudca.json diff --git a/results/luotuo-bert-medium/no_revision_available/Sohudca.json b/results/luotuo-bert-medium/no_revision_available/Sohudca.json deleted file mode 100644 index ef5e63b5..00000000 --- a/results/luotuo-bert-medium/no_revision_available/Sohudca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.542437913551226, - "spearman": 0.5499463904636713 - }, - "euclidean": { - "pearson": 0.5497963592956565, - "spearman": 0.5499463888138304 - }, - "evaluation_time": 60.89, - "manhattan": { - "pearson": 0.5483711470168247, - "spearman": 0.5479573268256736 - } - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/Sohudca.json b/results/m3e-base/no_revision_available/Sohudca.json deleted file mode 100644 index cb68e15d..00000000 --- a/results/m3e-base/no_revision_available/Sohudca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5936370764195946, - "spearman": 0.6027808478742518 - }, - "euclidean": { - "pearson": 0.5972763991624006, - "spearman": 0.6015376841316536 - }, - "evaluation_time": 11.05, - "manhattan": { - "pearson": 0.5974296464839446, - "spearman": 0.6004188367633153 - } - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/Sohudca.json b/results/m3e-large/no_revision_available/Sohudca.json deleted file mode 100644 index 4ae8cd5b..00000000 --- a/results/m3e-large/no_revision_available/Sohudca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5879100198296194, - "spearman": 0.600828349525583 - }, - "euclidean": { - "pearson": 0.5816894475215411, - "spearman": 0.5898885085907193 - }, - "evaluation_time": 34.04, - "manhattan": { - "pearson": 0.5846497885770858, - "spearman": 0.5925393742312323 - } - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/Sohudca.json b/results/text2vec-base-chinese/no_revision_available/Sohudca.json deleted file mode 100644 index 645d3391..00000000 --- a/results/text2vec-base-chinese/no_revision_available/Sohudca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.4748384334614316, - "spearman": 0.4764388479867917 - }, - "euclidean": { - "pearson": 0.44985246179548066, - "spearman": 0.4431366851409566 - }, - "evaluation_time": 3.97, - "manhattan": { - "pearson": 0.4531146839227391, - "spearman": 0.44729762731471157 - } - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/Sohudca.json b/results/text2vec-large-chinese/no_revision_available/Sohudca.json deleted file mode 100644 index b45fd012..00000000 --- a/results/text2vec-large-chinese/no_revision_available/Sohudca.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudca", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5381859490271976, - "spearman": 0.5426482863719896 - }, - "euclidean": { - "pearson": 0.5187022671843646, - "spearman": 0.5212878081829944 - }, - "evaluation_time": 34.77, - "manhattan": { - "pearson": 0.5179489622509401, - "spearman": 0.5196058838841765 - } - } -} \ No newline at end of file From 79254500067f10d53b9fbbc7f85649a0fe2dd610 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:59:05 +0200 Subject: [PATCH 10/15] remove WeiboSentiment --- .../no_revision_available/WeiboSentiment.json | 15 --------------- .../no_revision_available/WeiboSentiment.json | 15 --------------- .../no_revision_available/WeiboSentiment.json | 15 --------------- .../no_revision_available/WeiboSentiment.json | 15 --------------- .../no_revision_available/WeiboSentiment.json | 15 --------------- 5 files changed, 75 deletions(-) delete mode 100644 results/m3e-base/no_revision_available/WeiboSentiment.json delete mode 100644 results/m3e-large/no_revision_available/WeiboSentiment.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/WeiboSentiment.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/WeiboSentiment.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/WeiboSentiment.json diff --git a/results/m3e-base/no_revision_available/WeiboSentiment.json b/results/m3e-base/no_revision_available/WeiboSentiment.json deleted file mode 100644 index 601bb48f..00000000 --- a/results/m3e-base/no_revision_available/WeiboSentiment.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "WeiboSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.6859000000000001, - "accuracy_stderr": 0.027336605495196342, - "ap": 0.6411379634459208, - "ap_stderr": 0.022816706825929463, - "evaluation_time": 7.45, - "f1": 0.6835071066153737, - "f1_stderr": 0.026757331192039872, - "main_score": 0.6859000000000001 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/WeiboSentiment.json b/results/m3e-large/no_revision_available/WeiboSentiment.json deleted file mode 100644 index 6f864695..00000000 --- a/results/m3e-large/no_revision_available/WeiboSentiment.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "WeiboSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.7251000000000001, - "accuracy_stderr": 0.029588680267967352, - "ap": 0.6755043090595506, - "ap_stderr": 0.023723375013606357, - "evaluation_time": 10.3, - "f1": 0.7231900363290196, - "f1_stderr": 0.02952337784995097, - "main_score": 0.7251000000000001 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/WeiboSentiment.json b/results/text-embedding-ada-002/no_revision_available/WeiboSentiment.json deleted file mode 100644 index e95f0aa7..00000000 --- a/results/text-embedding-ada-002/no_revision_available/WeiboSentiment.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "WeiboSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.8003, - "accuracy_stderr": 0.021954726142678238, - "ap": 0.7503883528699425, - "ap_stderr": 0.021188003145962756, - "evaluation_time": 514.48, - "f1": 0.7993735448943509, - "f1_stderr": 0.022082510922554203, - "main_score": 0.8003 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/WeiboSentiment.json b/results/text2vec-base-chinese/no_revision_available/WeiboSentiment.json deleted file mode 100644 index a629fb36..00000000 --- a/results/text2vec-base-chinese/no_revision_available/WeiboSentiment.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "WeiboSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.7879000000000002, - "accuracy_stderr": 0.026527155897306445, - "ap": 0.7355125764818398, - "ap_stderr": 0.026251890520340687, - "evaluation_time": 27.76, - "f1": 0.7869403865462794, - "f1_stderr": 0.026625542756976248, - "main_score": 0.7879000000000002 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/WeiboSentiment.json b/results/text2vec-large-chinese/no_revision_available/WeiboSentiment.json deleted file mode 100644 index fd2627cf..00000000 --- a/results/text2vec-large-chinese/no_revision_available/WeiboSentiment.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "WeiboSentiment", - "mteb_version": "1.0.2", - "validation": { - "accuracy": 0.8423999999999999, - "accuracy_stderr": 0.01134195750300627, - "ap": 0.7922345550352325, - "ap_stderr": 0.014423918590653954, - "evaluation_time": 26.39, - "f1": 0.8415791720898544, - "f1_stderr": 0.011413333043376193, - "main_score": 0.8423999999999999 - } -} \ No newline at end of file From 0ea99a334541db946696844a24fb117cc70fa077 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 10:59:59 +0200 Subject: [PATCH 11/15] Remove Sohuccb --- .../no_revision_available/Sohuccb.json | 20 ------------------- .../no_revision_available/Sohuccb.json | 20 ------------------- .../no_revision_available/Sohuccb.json | 20 ------------------- .../no_revision_available/Sohuccb.json | 20 ------------------- .../no_revision_available/Sohuccb.json | 20 ------------------- 5 files changed, 100 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/Sohuccb.json delete mode 100644 results/m3e-base/no_revision_available/Sohuccb.json delete mode 100644 results/m3e-large/no_revision_available/Sohuccb.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/Sohuccb.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/Sohuccb.json diff --git a/results/luotuo-bert-medium/no_revision_available/Sohuccb.json b/results/luotuo-bert-medium/no_revision_available/Sohuccb.json deleted file mode 100644 index 9b41508b..00000000 --- a/results/luotuo-bert-medium/no_revision_available/Sohuccb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuccb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.469189176032861, - "spearman": 0.514790211662874 - }, - "euclidean": { - "pearson": 0.5311215196921583, - "spearman": 0.514790211662874 - }, - "evaluation_time": 63.46, - "manhattan": { - "pearson": 0.5314198257209855, - "spearman": 0.5143657865508068 - } - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/Sohuccb.json b/results/m3e-base/no_revision_available/Sohuccb.json deleted file mode 100644 index 2515f0d2..00000000 --- a/results/m3e-base/no_revision_available/Sohuccb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuccb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5053838963276963, - "spearman": 0.5012835066259131 - }, - "euclidean": { - "pearson": 0.535940365565754, - "spearman": 0.5025651040231355 - }, - "evaluation_time": 19.24, - "manhattan": { - "pearson": 0.5370298472046975, - "spearman": 0.5036053616507511 - } - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/Sohuccb.json b/results/m3e-large/no_revision_available/Sohuccb.json deleted file mode 100644 index 8d7086a4..00000000 --- a/results/m3e-large/no_revision_available/Sohuccb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuccb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.4915005475379004, - "spearman": 0.4990115839672006 - }, - "euclidean": { - "pearson": 0.538387666562128, - "spearman": 0.5082990040665526 - }, - "evaluation_time": 59.36, - "manhattan": { - "pearson": 0.5393943713252094, - "spearman": 0.509697110318068 - } - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/Sohuccb.json b/results/text2vec-base-chinese/no_revision_available/Sohuccb.json deleted file mode 100644 index 9e0e9a7e..00000000 --- a/results/text2vec-base-chinese/no_revision_available/Sohuccb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuccb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.4848625329628114, - "spearman": 0.47025928637971776 - }, - "euclidean": { - "pearson": 0.5063418023577525, - "spearman": 0.4619705061428607 - }, - "evaluation_time": 5.47, - "manhattan": { - "pearson": 0.5083530101451736, - "spearman": 0.4639678025854769 - } - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/Sohuccb.json b/results/text2vec-large-chinese/no_revision_available/Sohuccb.json deleted file mode 100644 index 42a09e20..00000000 --- a/results/text2vec-large-chinese/no_revision_available/Sohuccb.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohuccb", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.4968885488684754, - "spearman": 0.48474757137733554 - }, - "euclidean": { - "pearson": 0.5217076923363101, - "spearman": 0.481934714752263 - }, - "evaluation_time": 60.58, - "manhattan": { - "pearson": 0.5218790797141282, - "spearman": 0.4824340384135185 - } - } -} \ No newline at end of file From b41346e4711656483a703ef71b5ce57da95d0992 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 11:00:34 +0200 Subject: [PATCH 12/15] remove IFlyTekClutering --- .../no_revision_available/IFlyTekClutering.json | 10 ---------- .../no_revision_available/IFlyTekClutering.json | 10 ---------- .../no_revision_available/IFlyTekClutering.json | 10 ---------- .../no_revision_available/IFlyTekClutering.json | 10 ---------- .../no_revision_available/IFlyTekClutering.json | 10 ---------- .../no_revision_available/IFlyTekClutering.json | 10 ---------- 6 files changed, 60 deletions(-) delete mode 100644 results/luotuo-bert-medium/no_revision_available/IFlyTekClutering.json delete mode 100644 results/m3e-base/no_revision_available/IFlyTekClutering.json delete mode 100644 results/m3e-large/no_revision_available/IFlyTekClutering.json delete mode 100644 results/text-embedding-ada-002/no_revision_available/IFlyTekClutering.json delete mode 100644 results/text2vec-base-chinese/no_revision_available/IFlyTekClutering.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/IFlyTekClutering.json diff --git a/results/luotuo-bert-medium/no_revision_available/IFlyTekClutering.json b/results/luotuo-bert-medium/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index e8f45e50..00000000 --- a/results/luotuo-bert-medium/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 390.34, - "v_measure": 0.618217635198623, - "v_measure_std": 0.009145344699586482 - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/IFlyTekClutering.json b/results/m3e-base/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index 3d0bfe36..00000000 --- a/results/m3e-base/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 76.04, - "v_measure": 0.6112850458469564, - "v_measure_std": 0.009701335219332828 - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/IFlyTekClutering.json b/results/m3e-large/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index 656bd066..00000000 --- a/results/m3e-large/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 220.35, - "v_measure": 0.6198488693806539, - "v_measure_std": 0.006878910873130376 - } -} \ No newline at end of file diff --git a/results/text-embedding-ada-002/no_revision_available/IFlyTekClutering.json b/results/text-embedding-ada-002/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index f3c10e92..00000000 --- a/results/text-embedding-ada-002/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 622.08, - "v_measure": 0.6169628862745183, - "v_measure_std": 0.010604795246430208 - } -} \ No newline at end of file diff --git a/results/text2vec-base-chinese/no_revision_available/IFlyTekClutering.json b/results/text2vec-base-chinese/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index 50b0d117..00000000 --- a/results/text2vec-base-chinese/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 38.56, - "v_measure": 0.5863480465216687, - "v_measure_std": 0.008573136773751098 - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/IFlyTekClutering.json b/results/text2vec-large-chinese/no_revision_available/IFlyTekClutering.json deleted file mode 100644 index b275d317..00000000 --- a/results/text2vec-large-chinese/no_revision_available/IFlyTekClutering.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "dataset_revision": null, - "mteb_dataset_name": "IFlyTekClutering", - "mteb_version": "1.0.2", - "test": { - "evaluation_time": 225.47, - "v_measure": 0.5850791543049056, - "v_measure_std": 0.012146290969613569 - } -} \ No newline at end of file From b5e6609f00eef092ef46aa311cd2dc3233336b3e Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 11:05:18 +0200 Subject: [PATCH 13/15] remove Sohudda, overall_results --- .../overall_results.json | 40 ------------------- .../no_revision_available/Sohudda.json | 20 ---------- .../no_revision_available/Sohudda.json | 20 ---------- .../no_revision_available/Sohudda.json | 20 ---------- 4 files changed, 100 deletions(-) delete mode 100644 results/jina-embeddings-v2-base-en/no_revision_available/overall_results.json delete mode 100644 results/luotuo-bert-medium/no_revision_available/Sohudda.json delete mode 100644 results/m3e-base/no_revision_available/Sohudda.json delete mode 100644 results/m3e-large/no_revision_available/Sohudda.json diff --git a/results/jina-embeddings-v2-base-en/no_revision_available/overall_results.json b/results/jina-embeddings-v2-base-en/no_revision_available/overall_results.json deleted file mode 100644 index 087e0f9b..00000000 --- a/results/jina-embeddings-v2-base-en/no_revision_available/overall_results.json +++ /dev/null @@ -1,40 +0,0 @@ -{ - "LEMBNeedleRetrieval": { - "256": 0.86, - "512": 0.72, - "1024": 0.7, - "2048": 0.7, - "4096": 0.54, - "8192": 0.42, - "16384": 0.24, - "32768": 0.16, - "avg": 0.5425000000000001 - }, - "LEMBPasskeyRetrieval": { - "256": 1.0, - "512": 0.68, - "1024": 0.56, - "2048": 0.14, - "4096": 0.54, - "8192": 0.58, - "16384": 0.34, - "32768": 0.18, - "avg": 0.5025000000000001 - }, - "LEMBNarrativeQARetrieval": { - "ndcg@1": 0.27811, - "ndcg@10": 0.37893 - }, - "LEMBQMSumRetrieval": { - "ndcg@1": 0.23772, - "ndcg@10": 0.38866 - }, - "LEMBSummScreenFDRetrieval": { - "ndcg@1": 0.875, - "ndcg@10": 0.93479 - }, - "LEMBWikimQARetrieval": { - "ndcg@1": 0.66333, - "ndcg@10": 0.73988 - } -} \ No newline at end of file diff --git a/results/luotuo-bert-medium/no_revision_available/Sohudda.json b/results/luotuo-bert-medium/no_revision_available/Sohudda.json deleted file mode 100644 index 752b0e73..00000000 --- a/results/luotuo-bert-medium/no_revision_available/Sohudda.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudda", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6002501387294787, - "spearman": 0.5809597956772022 - }, - "euclidean": { - "pearson": 0.5960056429965963, - "spearman": 0.5809559440071916 - }, - "evaluation_time": 16.95, - "manhattan": { - "pearson": 0.5948977548001798, - "spearman": 0.5796419284658363 - } - } -} \ No newline at end of file diff --git a/results/m3e-base/no_revision_available/Sohudda.json b/results/m3e-base/no_revision_available/Sohudda.json deleted file mode 100644 index f5c26f9f..00000000 --- a/results/m3e-base/no_revision_available/Sohudda.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudda", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6299846392251068, - "spearman": 0.6102226132301666 - }, - "euclidean": { - "pearson": 0.6148706394464605, - "spearman": 0.6079465352770246 - }, - "evaluation_time": 2.52, - "manhattan": { - "pearson": 0.6146504770155468, - "spearman": 0.6076382635454286 - } - } -} \ No newline at end of file diff --git a/results/m3e-large/no_revision_available/Sohudda.json b/results/m3e-large/no_revision_available/Sohudda.json deleted file mode 100644 index 16609ce3..00000000 --- a/results/m3e-large/no_revision_available/Sohudda.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudda", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.6137556772736376, - "spearman": 0.6060994614285242 - }, - "euclidean": { - "pearson": 0.6214689591193363, - "spearman": 0.6062899312194179 - }, - "evaluation_time": 7.61, - "manhattan": { - "pearson": 0.6226755835385295, - "spearman": 0.6077118372406303 - } - } -} \ No newline at end of file From f5619187e65c5feeed4f81492adce6a1e8e97d64 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 11:05:34 +0200 Subject: [PATCH 14/15] Remove comments from results files --- .../no_revision_available/MSMARCO-PL.json | 1 - .../no_revision_available/MSMARCO-PL.json | 1 - .../no_revision_available/MSMARCO-PL.json | 1 - .../no_revision_available/MSMARCO-PL.json | 1 - .../no_revision_available/MSMARCO-PL.json | 1 - .../no_revision_available/Sohudda.json | 20 ------------------- .../no_revision_available/Sohudda.json | 20 ------------------- 7 files changed, 45 deletions(-) delete mode 100644 results/text2vec-base-chinese/no_revision_available/Sohudda.json delete mode 100644 results/text2vec-large-chinese/no_revision_available/Sohudda.json diff --git a/results/paraphrase-multilingual-MiniLM-L12-v2/no_revision_available/MSMARCO-PL.json b/results/paraphrase-multilingual-MiniLM-L12-v2/no_revision_available/MSMARCO-PL.json index 60e6343e..e422642e 100644 --- a/results/paraphrase-multilingual-MiniLM-L12-v2/no_revision_available/MSMARCO-PL.json +++ b/results/paraphrase-multilingual-MiniLM-L12-v2/no_revision_available/MSMARCO-PL.json @@ -2,7 +2,6 @@ "dataset_revision": null, "mteb_dataset_name": "MSMARCO-PL", "mteb_version": "1.1.1", - "comment": "This is a validation split that has been marked as test for the purposes of the https://huggingface.co/spaces/mteb/leaderboard/blob/main/app.py script.", "test": { "evaluation_time": 3808.37, "map_at_1": 0.04651, diff --git a/results/paraphrase-multilingual-mpnet-base-v2/no_revision_available/MSMARCO-PL.json b/results/paraphrase-multilingual-mpnet-base-v2/no_revision_available/MSMARCO-PL.json index a2c2cc0f..87e86da1 100644 --- a/results/paraphrase-multilingual-mpnet-base-v2/no_revision_available/MSMARCO-PL.json +++ b/results/paraphrase-multilingual-mpnet-base-v2/no_revision_available/MSMARCO-PL.json @@ -2,7 +2,6 @@ "dataset_revision": null, "mteb_dataset_name": "MSMARCO-PL", "mteb_version": "1.1.1", - "comment": "This is a validation split that has been marked as test for the purposes of the https://huggingface.co/spaces/mteb/leaderboard/blob/main/app.py script.", "test": { "evaluation_time": 7281.28, "map_at_1": 0.05528, diff --git a/results/silver-retriever-base-v1/no_revision_available/MSMARCO-PL.json b/results/silver-retriever-base-v1/no_revision_available/MSMARCO-PL.json index 34bec8d3..eeab90f5 100644 --- a/results/silver-retriever-base-v1/no_revision_available/MSMARCO-PL.json +++ b/results/silver-retriever-base-v1/no_revision_available/MSMARCO-PL.json @@ -2,7 +2,6 @@ "dataset_revision": null, "mteb_dataset_name": "MSMARCO-PL", "mteb_version": "1.1.1", - "comment": "This is a validation split that has been marked as test for the purposes of the https://huggingface.co/spaces/mteb/leaderboard/blob/main/app.py script.", "test": { "evaluation_time": 8814.37, "map_at_1": 0.11603, diff --git a/results/st-polish-paraphrase-from-distilroberta/no_revision_available/MSMARCO-PL.json b/results/st-polish-paraphrase-from-distilroberta/no_revision_available/MSMARCO-PL.json index 9ec94741..c48e2bd2 100644 --- a/results/st-polish-paraphrase-from-distilroberta/no_revision_available/MSMARCO-PL.json +++ b/results/st-polish-paraphrase-from-distilroberta/no_revision_available/MSMARCO-PL.json @@ -2,7 +2,6 @@ "dataset_revision": null, "mteb_dataset_name": "MSMARCO-PL", "mteb_version": "1.1.1", - "comment": "This is a validation split that has been marked as test for the purposes of the https://huggingface.co/spaces/mteb/leaderboard/blob/main/app.py script.", "test": { "evaluation_time": 10716.01, "map_at_1": 0.07538, diff --git a/results/st-polish-paraphrase-from-mpnet/no_revision_available/MSMARCO-PL.json b/results/st-polish-paraphrase-from-mpnet/no_revision_available/MSMARCO-PL.json index 15fbdf9e..7a64484b 100644 --- a/results/st-polish-paraphrase-from-mpnet/no_revision_available/MSMARCO-PL.json +++ b/results/st-polish-paraphrase-from-mpnet/no_revision_available/MSMARCO-PL.json @@ -2,7 +2,6 @@ "dataset_revision": null, "mteb_dataset_name": "MSMARCO-PL", "mteb_version": "1.1.1", - "comment": "This is a validation split that has been marked as test for the purposes of the https://huggingface.co/spaces/mteb/leaderboard/blob/main/app.py script.", "test": { "evaluation_time": 8535.58, "map_at_1": 0.0852, diff --git a/results/text2vec-base-chinese/no_revision_available/Sohudda.json b/results/text2vec-base-chinese/no_revision_available/Sohudda.json deleted file mode 100644 index f2d7fec8..00000000 --- a/results/text2vec-base-chinese/no_revision_available/Sohudda.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudda", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5269179681250432, - "spearman": 0.5093714774621678 - }, - "euclidean": { - "pearson": 0.506683256572653, - "spearman": 0.4706116073284235 - }, - "evaluation_time": 2.34, - "manhattan": { - "pearson": 0.5080765532241487, - "spearman": 0.4712975121184771 - } - } -} \ No newline at end of file diff --git a/results/text2vec-large-chinese/no_revision_available/Sohudda.json b/results/text2vec-large-chinese/no_revision_available/Sohudda.json deleted file mode 100644 index 9a3444b7..00000000 --- a/results/text2vec-large-chinese/no_revision_available/Sohudda.json +++ /dev/null @@ -1,20 +0,0 @@ -{ - "dataset_revision": "a0d554a64d88156834ff5ae9920b964011b16384", - "mteb_dataset_name": "Sohudda", - "mteb_version": "1.0.2", - "test": { - "cos_sim": { - "pearson": 0.5984744682842694, - "spearman": 0.5730757128863982 - }, - "euclidean": { - "pearson": 0.5560408126388445, - "spearman": 0.5455680711837269 - }, - "evaluation_time": 7.75, - "manhattan": { - "pearson": 0.5562645845539591, - "spearman": 0.5470554831632787 - } - } -} \ No newline at end of file From d2b7c0f101bd9142e84b28f32ec287478614f971 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Tue, 9 Jul 2024 12:57:02 +0200 Subject: [PATCH 15/15] remove mteb version = test --- .../no_revision_available/STSBenchmarkMultilingualSTS.json | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/results/voyage-multilingual-2/no_revision_available/STSBenchmarkMultilingualSTS.json b/results/voyage-multilingual-2/no_revision_available/STSBenchmarkMultilingualSTS.json index 841191a3..fad88904 100644 --- a/results/voyage-multilingual-2/no_revision_available/STSBenchmarkMultilingualSTS.json +++ b/results/voyage-multilingual-2/no_revision_available/STSBenchmarkMultilingualSTS.json @@ -17,6 +17,5 @@ } } }, - "mteb_dataset_name": "STSBenchmarkMultilingualSTS", - "mteb_version": "test" + "mteb_dataset_name": "STSBenchmarkMultilingualSTS" } \ No newline at end of file