Muennighoff
committed on
Commit
·
aa91968
1
Parent(s):
41063e3
Add MTEB eval
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- {eval → evaluation/beir}/beir.json +0 -0
- evaluation/mteb/AmazonCounterfactualClassification.json +16 -0
- evaluation/mteb/AmazonPolarityClassification.json +14 -0
- evaluation/mteb/AmazonReviewsClassification.json +14 -0
- evaluation/mteb/ArguAna.json +37 -0
- evaluation/mteb/ArxivClusteringP2P.json +9 -0
- evaluation/mteb/ArxivClusteringS2S.json +9 -0
- evaluation/mteb/AskUbuntuDupQuestions.json +9 -0
- evaluation/mteb/BIOSSES.json +19 -0
- evaluation/mteb/Banking77Classification.json +12 -0
- evaluation/mteb/BiorxivClusteringP2P.json +9 -0
- evaluation/mteb/BiorxivClusteringS2S.json +9 -0
- evaluation/mteb/CQADupstackAndroidRetrieval.json +37 -0
- evaluation/mteb/CQADupstackEnglishRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGamingRetrieval.json +37 -0
- evaluation/mteb/CQADupstackGisRetrieval.json +37 -0
- evaluation/mteb/CQADupstackMathematicaRetrieval.json +37 -0
- evaluation/mteb/CQADupstackPhysicsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackProgrammersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackRetrieval.json +1 -0
- evaluation/mteb/CQADupstackStatsRetrieval.json +37 -0
- evaluation/mteb/CQADupstackTexRetrieval.json +37 -0
- evaluation/mteb/CQADupstackUnixRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWebmastersRetrieval.json +37 -0
- evaluation/mteb/CQADupstackWordpressRetrieval.json +37 -0
- evaluation/mteb/ClimateFEVER.json +37 -0
- evaluation/mteb/DBPedia.json +37 -0
- evaluation/mteb/EmotionClassification.json +12 -0
- evaluation/mteb/FEVER.json +37 -0
- evaluation/mteb/FiQA2018.json +37 -0
- evaluation/mteb/HotpotQA.json +37 -0
- evaluation/mteb/ImdbClassification.json +14 -0
- evaluation/mteb/MSMARCO.json +37 -0
- evaluation/mteb/MTOPDomainClassification.json +14 -0
- evaluation/mteb/MTOPIntentClassification.json +14 -0
- evaluation/mteb/MassiveIntentClassification.json +14 -0
- evaluation/mteb/MassiveScenarioClassification.json +14 -0
- evaluation/mteb/MedrxivClusteringP2P.json +9 -0
- evaluation/mteb/MedrxivClusteringS2S.json +9 -0
- evaluation/mteb/NFCorpus.json +37 -0
- evaluation/mteb/NQ.json +37 -0
- evaluation/mteb/QuoraRetrieval.json +37 -0
- evaluation/mteb/RedditClustering.json +9 -0
- evaluation/mteb/RedditClusteringP2P.json +9 -0
- evaluation/mteb/SCIDOCS.json +37 -0
- evaluation/mteb/SGPT-2.7B-weightedmean-msmarco-specb-bitfit_results.csv +354 -0
- evaluation/mteb/SICK-R.json +19 -0
- evaluation/mteb/STS12.json +19 -0
- evaluation/mteb/STS13.json +19 -0
- evaluation/mteb/STS14.json +19 -0
{eval → evaluation/beir}/beir.json
RENAMED
File without changes
|
evaluation/mteb/AmazonCounterfactualClassification.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.6756716417910448,
|
7 |
+
"accuracy_stderr": 0.035149491395717075,
|
8 |
+
"ap": 0.3075574629595259,
|
9 |
+
"ap_stderr": 0.022378514563472136,
|
10 |
+
"f1": 0.6180512130185866,
|
11 |
+
"f1_stderr": 0.027752667739340424,
|
12 |
+
"main_score": 0.6756716417910448
|
13 |
+
},
|
14 |
+
"evaluation_time": 33.75
|
15 |
+
}
|
16 |
+
}
|
evaluation/mteb/AmazonPolarityClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.71439575,
|
6 |
+
"accuracy_stderr": 0.04118535930779893,
|
7 |
+
"ap": 0.6591341330532453,
|
8 |
+
"ap_stderr": 0.039567766080541335,
|
9 |
+
"evaluation_time": 15193.17,
|
10 |
+
"f1": 0.7090561852619555,
|
11 |
+
"f1_stderr": 0.04610604328985526,
|
12 |
+
"main_score": 0.71439575
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/AmazonReviewsClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.35748,
|
7 |
+
"accuracy_stderr": 0.017313624692709504,
|
8 |
+
"f1": 0.35485762871863474,
|
9 |
+
"f1_stderr": 0.016676501915976406,
|
10 |
+
"main_score": 0.35748
|
11 |
+
},
|
12 |
+
"evaluation_time": 125.24
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/ArguAna.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 254.16,
|
6 |
+
"map_at_1": 0.2596,
|
7 |
+
"map_at_10": 0.41619,
|
8 |
+
"map_at_100": 0.42673,
|
9 |
+
"map_at_1000": 0.42684,
|
10 |
+
"map_at_3": 0.36569,
|
11 |
+
"map_at_5": 0.39397,
|
12 |
+
"mrr_at_1": 0.26316,
|
13 |
+
"mrr_at_10": 0.41772,
|
14 |
+
"mrr_at_100": 0.4282,
|
15 |
+
"mrr_at_1000": 0.4283,
|
16 |
+
"mrr_at_3": 0.36724,
|
17 |
+
"mrr_at_5": 0.39529,
|
18 |
+
"ndcg_at_1": 0.2596,
|
19 |
+
"ndcg_at_10": 0.50491,
|
20 |
+
"ndcg_at_100": 0.54865,
|
21 |
+
"ndcg_at_1000": 0.55107,
|
22 |
+
"ndcg_at_3": 0.40053,
|
23 |
+
"ndcg_at_5": 0.45134,
|
24 |
+
"precision_at_1": 0.2596,
|
25 |
+
"precision_at_10": 0.07895,
|
26 |
+
"precision_at_100": 0.00978,
|
27 |
+
"precision_at_1000": 0.001,
|
28 |
+
"precision_at_3": 0.16714,
|
29 |
+
"precision_at_5": 0.12489,
|
30 |
+
"recall_at_1": 0.2596,
|
31 |
+
"recall_at_10": 0.78947,
|
32 |
+
"recall_at_100": 0.97795,
|
33 |
+
"recall_at_1000": 0.99644,
|
34 |
+
"recall_at_3": 0.50142,
|
35 |
+
"recall_at_5": 0.62447
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ArxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 57365.88,
|
6 |
+
"v_measure": 0.44721257146422017,
|
7 |
+
"v_measure_std": 0.135218958073186
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/ArxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 6983.79,
|
6 |
+
"v_measure": 0.35081451519142065,
|
7 |
+
"v_measure_std": 0.14064701566219873
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/AskUbuntuDupQuestions.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 56.03,
|
6 |
+
"map": 0.5963466199039206,
|
7 |
+
"mrr": 0.736813525040672
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/BIOSSES.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.8742754550496836,
|
7 |
+
"spearman": 0.8484289705838665
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.8559331970450859,
|
11 |
+
"spearman": 0.858525586184271
|
12 |
+
},
|
13 |
+
"evaluation_time": 6.0,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.8541233134466698,
|
16 |
+
"spearman": 0.8552303303767403
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/Banking77Classification.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.8321753246753246,
|
6 |
+
"accuracy_stderr": 0.008047037149251285,
|
7 |
+
"evaluation_time": 109.45,
|
8 |
+
"f1": 0.8315394543120915,
|
9 |
+
"f1_stderr": 0.008443343664861741,
|
10 |
+
"main_score": 0.8321753246753246
|
11 |
+
}
|
12 |
+
}
|
evaluation/mteb/BiorxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 6657.01,
|
6 |
+
"v_measure": 0.3441414219680629,
|
7 |
+
"v_measure_std": 0.010243021348181702
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/BiorxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 843.62,
|
6 |
+
"v_measure": 0.30533275862270026,
|
7 |
+
"v_measure_std": 0.011135486000086606
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/CQADupstackAndroidRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1118.91,
|
6 |
+
"map_at_1": 0.30809,
|
7 |
+
"map_at_10": 0.40617,
|
8 |
+
"map_at_100": 0.41895,
|
9 |
+
"map_at_1000": 0.42025,
|
10 |
+
"map_at_3": 0.37,
|
11 |
+
"map_at_5": 0.38993,
|
12 |
+
"mrr_at_1": 0.37482,
|
13 |
+
"mrr_at_10": 0.46497,
|
14 |
+
"mrr_at_100": 0.47144,
|
15 |
+
"mrr_at_1000": 0.47189,
|
16 |
+
"mrr_at_3": 0.43705,
|
17 |
+
"mrr_at_5": 0.45193,
|
18 |
+
"ndcg_at_1": 0.37482,
|
19 |
+
"ndcg_at_10": 0.46688,
|
20 |
+
"ndcg_at_100": 0.51726,
|
21 |
+
"ndcg_at_1000": 0.53825,
|
22 |
+
"ndcg_at_3": 0.41242,
|
23 |
+
"ndcg_at_5": 0.43657,
|
24 |
+
"precision_at_1": 0.37482,
|
25 |
+
"precision_at_10": 0.08827,
|
26 |
+
"precision_at_100": 0.01393,
|
27 |
+
"precision_at_1000": 0.00186,
|
28 |
+
"precision_at_3": 0.19361,
|
29 |
+
"precision_at_5": 0.14106,
|
30 |
+
"recall_at_1": 0.30809,
|
31 |
+
"recall_at_10": 0.5847,
|
32 |
+
"recall_at_100": 0.80519,
|
33 |
+
"recall_at_1000": 0.93809,
|
34 |
+
"recall_at_3": 0.42462,
|
35 |
+
"recall_at_5": 0.49385
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackEnglishRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1732.23,
|
6 |
+
"map_at_1": 0.26962,
|
7 |
+
"map_at_10": 0.3693,
|
8 |
+
"map_at_100": 0.38102,
|
9 |
+
"map_at_1000": 0.3822,
|
10 |
+
"map_at_3": 0.34065,
|
11 |
+
"map_at_5": 0.3572,
|
12 |
+
"mrr_at_1": 0.33567,
|
13 |
+
"mrr_at_10": 0.42269,
|
14 |
+
"mrr_at_100": 0.4299,
|
15 |
+
"mrr_at_1000": 0.43033,
|
16 |
+
"mrr_at_3": 0.40064,
|
17 |
+
"mrr_at_5": 0.41258,
|
18 |
+
"ndcg_at_1": 0.33567,
|
19 |
+
"ndcg_at_10": 0.42405,
|
20 |
+
"ndcg_at_100": 0.46847,
|
21 |
+
"ndcg_at_1000": 0.48951,
|
22 |
+
"ndcg_at_3": 0.38312,
|
23 |
+
"ndcg_at_5": 0.40242,
|
24 |
+
"precision_at_1": 0.33567,
|
25 |
+
"precision_at_10": 0.08032,
|
26 |
+
"precision_at_100": 0.01295,
|
27 |
+
"precision_at_1000": 0.00176,
|
28 |
+
"precision_at_3": 0.18662,
|
29 |
+
"precision_at_5": 0.13299,
|
30 |
+
"recall_at_1": 0.26962,
|
31 |
+
"recall_at_10": 0.52489,
|
32 |
+
"recall_at_100": 0.71635,
|
33 |
+
"recall_at_1000": 0.85141,
|
34 |
+
"recall_at_3": 0.4028,
|
35 |
+
"recall_at_5": 0.45757
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackGamingRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1830.25,
|
6 |
+
"map_at_1": 0.36318,
|
7 |
+
"map_at_10": 0.4797,
|
8 |
+
"map_at_100": 0.49003,
|
9 |
+
"map_at_1000": 0.49066,
|
10 |
+
"map_at_3": 0.45031,
|
11 |
+
"map_at_5": 0.46633,
|
12 |
+
"mrr_at_1": 0.41505,
|
13 |
+
"mrr_at_10": 0.51431,
|
14 |
+
"mrr_at_100": 0.52129,
|
15 |
+
"mrr_at_1000": 0.52161,
|
16 |
+
"mrr_at_3": 0.48934,
|
17 |
+
"mrr_at_5": 0.5042,
|
18 |
+
"ndcg_at_1": 0.41505,
|
19 |
+
"ndcg_at_10": 0.53676,
|
20 |
+
"ndcg_at_100": 0.57867,
|
21 |
+
"ndcg_at_1000": 0.59166,
|
22 |
+
"ndcg_at_3": 0.48516,
|
23 |
+
"ndcg_at_5": 0.50984,
|
24 |
+
"precision_at_1": 0.41505,
|
25 |
+
"precision_at_10": 0.08608,
|
26 |
+
"precision_at_100": 0.01156,
|
27 |
+
"precision_at_1000": 0.00133,
|
28 |
+
"precision_at_3": 0.21463,
|
29 |
+
"precision_at_5": 0.14721,
|
30 |
+
"recall_at_1": 0.36318,
|
31 |
+
"recall_at_10": 0.67066,
|
32 |
+
"recall_at_100": 0.8534,
|
33 |
+
"recall_at_1000": 0.94491,
|
34 |
+
"recall_at_3": 0.53216,
|
35 |
+
"recall_at_5": 0.59214
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackGisRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 2522.93,
|
6 |
+
"map_at_1": 0.22167,
|
7 |
+
"map_at_10": 0.29544,
|
8 |
+
"map_at_100": 0.30579,
|
9 |
+
"map_at_1000": 0.3067,
|
10 |
+
"map_at_3": 0.26982,
|
11 |
+
"map_at_5": 0.28474,
|
12 |
+
"mrr_at_1": 0.24068,
|
13 |
+
"mrr_at_10": 0.31237,
|
14 |
+
"mrr_at_100": 0.32222,
|
15 |
+
"mrr_at_1000": 0.32292,
|
16 |
+
"mrr_at_3": 0.28776,
|
17 |
+
"mrr_at_5": 0.30234,
|
18 |
+
"ndcg_at_1": 0.24068,
|
19 |
+
"ndcg_at_10": 0.33973,
|
20 |
+
"ndcg_at_100": 0.39135,
|
21 |
+
"ndcg_at_1000": 0.41444,
|
22 |
+
"ndcg_at_3": 0.29018,
|
23 |
+
"ndcg_at_5": 0.31559,
|
24 |
+
"precision_at_1": 0.24068,
|
25 |
+
"precision_at_10": 0.05299,
|
26 |
+
"precision_at_100": 0.00823,
|
27 |
+
"precision_at_1000": 0.00106,
|
28 |
+
"precision_at_3": 0.12166,
|
29 |
+
"precision_at_5": 0.08768,
|
30 |
+
"recall_at_1": 0.22167,
|
31 |
+
"recall_at_10": 0.46115,
|
32 |
+
"recall_at_100": 0.69867,
|
33 |
+
"recall_at_1000": 0.87234,
|
34 |
+
"recall_at_3": 0.32798,
|
35 |
+
"recall_at_5": 0.38951
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackMathematicaRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1350.85,
|
6 |
+
"map_at_1": 0.12033,
|
7 |
+
"map_at_10": 0.19314,
|
8 |
+
"map_at_100": 0.20562,
|
9 |
+
"map_at_1000": 0.20695,
|
10 |
+
"map_at_3": 0.16946,
|
11 |
+
"map_at_5": 0.18077,
|
12 |
+
"mrr_at_1": 0.14801,
|
13 |
+
"mrr_at_10": 0.2274,
|
14 |
+
"mrr_at_100": 0.23876,
|
15 |
+
"mrr_at_1000": 0.23949,
|
16 |
+
"mrr_at_3": 0.20211,
|
17 |
+
"mrr_at_5": 0.21573,
|
18 |
+
"ndcg_at_1": 0.14801,
|
19 |
+
"ndcg_at_10": 0.24038,
|
20 |
+
"ndcg_at_100": 0.30186,
|
21 |
+
"ndcg_at_1000": 0.33321,
|
22 |
+
"ndcg_at_3": 0.19431,
|
23 |
+
"ndcg_at_5": 0.2134,
|
24 |
+
"precision_at_1": 0.14801,
|
25 |
+
"precision_at_10": 0.04776,
|
26 |
+
"precision_at_100": 0.00897,
|
27 |
+
"precision_at_1000": 0.00133,
|
28 |
+
"precision_at_3": 0.0966,
|
29 |
+
"precision_at_5": 0.07239,
|
30 |
+
"recall_at_1": 0.12033,
|
31 |
+
"recall_at_10": 0.35098,
|
32 |
+
"recall_at_100": 0.62175,
|
33 |
+
"recall_at_1000": 0.84171,
|
34 |
+
"recall_at_3": 0.2261,
|
35 |
+
"recall_at_5": 0.27279
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackPhysicsRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 2467.52,
|
6 |
+
"map_at_1": 0.26651,
|
7 |
+
"map_at_10": 0.36901,
|
8 |
+
"map_at_100": 0.38249,
|
9 |
+
"map_at_1000": 0.38361,
|
10 |
+
"map_at_3": 0.33891,
|
11 |
+
"map_at_5": 0.35439,
|
12 |
+
"mrr_at_1": 0.32724,
|
13 |
+
"mrr_at_10": 0.42504,
|
14 |
+
"mrr_at_100": 0.43392,
|
15 |
+
"mrr_at_1000": 0.43436,
|
16 |
+
"mrr_at_3": 0.3999,
|
17 |
+
"mrr_at_5": 0.41347,
|
18 |
+
"ndcg_at_1": 0.32724,
|
19 |
+
"ndcg_at_10": 0.43007,
|
20 |
+
"ndcg_at_100": 0.48601,
|
21 |
+
"ndcg_at_1000": 0.50697,
|
22 |
+
"ndcg_at_3": 0.3799,
|
23 |
+
"ndcg_at_5": 0.40084,
|
24 |
+
"precision_at_1": 0.32724,
|
25 |
+
"precision_at_10": 0.07873,
|
26 |
+
"precision_at_100": 0.01247,
|
27 |
+
"precision_at_1000": 0.00162,
|
28 |
+
"precision_at_3": 0.18062,
|
29 |
+
"precision_at_5": 0.12666,
|
30 |
+
"recall_at_1": 0.26651,
|
31 |
+
"recall_at_10": 0.55674,
|
32 |
+
"recall_at_100": 0.78904,
|
33 |
+
"recall_at_1000": 0.92558,
|
34 |
+
"recall_at_3": 0.4136,
|
35 |
+
"recall_at_5": 0.46984
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackProgrammersRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 2301.71,
|
6 |
+
"map_at_1": 0.22589,
|
7 |
+
"map_at_10": 0.32244,
|
8 |
+
"map_at_100": 0.3346,
|
9 |
+
"map_at_1000": 0.33593,
|
10 |
+
"map_at_3": 0.2921,
|
11 |
+
"map_at_5": 0.3102,
|
12 |
+
"mrr_at_1": 0.28425,
|
13 |
+
"mrr_at_10": 0.37282,
|
14 |
+
"mrr_at_100": 0.38187,
|
15 |
+
"mrr_at_1000": 0.38248,
|
16 |
+
"mrr_at_3": 0.34684,
|
17 |
+
"mrr_at_5": 0.36123,
|
18 |
+
"ndcg_at_1": 0.28425,
|
19 |
+
"ndcg_at_10": 0.37942,
|
20 |
+
"ndcg_at_100": 0.43443,
|
21 |
+
"ndcg_at_1000": 0.45996,
|
22 |
+
"ndcg_at_3": 0.32874,
|
23 |
+
"ndcg_at_5": 0.35325,
|
24 |
+
"precision_at_1": 0.28425,
|
25 |
+
"precision_at_10": 0.071,
|
26 |
+
"precision_at_100": 0.01166,
|
27 |
+
"precision_at_1000": 0.00158,
|
28 |
+
"precision_at_3": 0.1602,
|
29 |
+
"precision_at_5": 0.11644,
|
30 |
+
"recall_at_1": 0.22589,
|
31 |
+
"recall_at_10": 0.5004,
|
32 |
+
"recall_at_100": 0.73973,
|
33 |
+
"recall_at_1000": 0.91128,
|
34 |
+
"recall_at_3": 0.35883,
|
35 |
+
"recall_at_5": 0.42188
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackRetrieval.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"dataset_version": null, "mteb_version": "0.0.2", "test": {"evaluation_time": 3522.66, "map_at_1": 0.23190833333333336, "map_at_10": 0.31504916666666666, "map_at_100": 0.32649083333333334, "map_at_1000": 0.3277075, "map_at_3": 0.2882575, "map_at_5": 0.302755, "mrr_at_1": 0.27427499999999994, "mrr_at_10": 0.35364833333333334, "mrr_at_100": 0.36234416666666663, "mrr_at_1000": 0.36297583333333333, "mrr_at_3": 0.3297966666666667, "mrr_at_5": 0.34294583333333334, "ndcg_at_1": 0.27427499999999994, "ndcg_at_10": 0.3653358333333333, "ndcg_at_100": 0.4164508333333333, "ndcg_at_1000": 0.4414499999999999, "ndcg_at_3": 0.3188908333333333, "ndcg_at_5": 0.33984333333333333, "precision_at_1": 0.27427499999999994, "precision_at_10": 0.06481083333333333, "precision_at_100": 0.010610833333333333, "precision_at_1000": 0.0014691666666666666, "precision_at_3": 0.1465675, "precision_at_5": 0.10493583333333333, "recall_at_1": 0.23190833333333336, "recall_at_10": 0.4765175, "recall_at_100": 0.7041016666666666, "recall_at_1000": 0.8782708333333332, "recall_at_3": 0.34637583333333327, "recall_at_5": 0.4005008333333333}}
|
evaluation/mteb/CQADupstackStatsRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3154.61,
|
6 |
+
"map_at_1": 0.20409,
|
7 |
+
"map_at_10": 0.26794,
|
8 |
+
"map_at_100": 0.27682,
|
9 |
+
"map_at_1000": 0.27783,
|
10 |
+
"map_at_3": 0.24461,
|
11 |
+
"map_at_5": 0.25668,
|
12 |
+
"mrr_at_1": 0.22853,
|
13 |
+
"mrr_at_10": 0.29296,
|
14 |
+
"mrr_at_100": 0.30103,
|
15 |
+
"mrr_at_1000": 0.30179,
|
16 |
+
"mrr_at_3": 0.27173,
|
17 |
+
"mrr_at_5": 0.28223,
|
18 |
+
"ndcg_at_1": 0.22853,
|
19 |
+
"ndcg_at_10": 0.31007,
|
20 |
+
"ndcg_at_100": 0.35581,
|
21 |
+
"ndcg_at_1000": 0.38147,
|
22 |
+
"ndcg_at_3": 0.26591,
|
23 |
+
"ndcg_at_5": 0.2843,
|
24 |
+
"precision_at_1": 0.22853,
|
25 |
+
"precision_at_10": 0.05031,
|
26 |
+
"precision_at_100": 0.00794,
|
27 |
+
"precision_at_1000": 0.0011,
|
28 |
+
"precision_at_3": 0.11401,
|
29 |
+
"precision_at_5": 0.0816,
|
30 |
+
"recall_at_1": 0.20409,
|
31 |
+
"recall_at_10": 0.41766,
|
32 |
+
"recall_at_100": 0.62964,
|
33 |
+
"recall_at_1000": 0.81682,
|
34 |
+
"recall_at_3": 0.29281,
|
35 |
+
"recall_at_5": 0.3383
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackTexRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 5341.04,
|
6 |
+
"map_at_1": 0.14549,
|
7 |
+
"map_at_10": 0.20315,
|
8 |
+
"map_at_100": 0.21301,
|
9 |
+
"map_at_1000": 0.21425,
|
10 |
+
"map_at_3": 0.18132,
|
11 |
+
"map_at_5": 0.19429,
|
12 |
+
"mrr_at_1": 0.1786,
|
13 |
+
"mrr_at_10": 0.23861,
|
14 |
+
"mrr_at_100": 0.24737,
|
15 |
+
"mrr_at_1000": 0.2482,
|
16 |
+
"mrr_at_3": 0.21685,
|
17 |
+
"mrr_at_5": 0.23008,
|
18 |
+
"ndcg_at_1": 0.1786,
|
19 |
+
"ndcg_at_10": 0.24396,
|
20 |
+
"ndcg_at_100": 0.29328,
|
21 |
+
"ndcg_at_1000": 0.32486,
|
22 |
+
"ndcg_at_3": 0.20375,
|
23 |
+
"ndcg_at_5": 0.22411,
|
24 |
+
"precision_at_1": 0.1786,
|
25 |
+
"precision_at_10": 0.0447,
|
26 |
+
"precision_at_100": 0.0081,
|
27 |
+
"precision_at_1000": 0.00125,
|
28 |
+
"precision_at_3": 0.09475,
|
29 |
+
"precision_at_5": 0.07171,
|
30 |
+
"recall_at_1": 0.14549,
|
31 |
+
"recall_at_10": 0.33365,
|
32 |
+
"recall_at_100": 0.55797,
|
33 |
+
"recall_at_1000": 0.78632,
|
34 |
+
"recall_at_3": 0.22229,
|
35 |
+
"recall_at_5": 0.27339
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackUnixRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3320.59,
|
6 |
+
"map_at_1": 0.23286,
|
7 |
+
"map_at_10": 0.30728,
|
8 |
+
"map_at_100": 0.3184,
|
9 |
+
"map_at_1000": 0.31953,
|
10 |
+
"map_at_3": 0.28302,
|
11 |
+
"map_at_5": 0.29615,
|
12 |
+
"mrr_at_1": 0.27239,
|
13 |
+
"mrr_at_10": 0.34408,
|
14 |
+
"mrr_at_100": 0.35335,
|
15 |
+
"mrr_at_1000": 0.35405,
|
16 |
+
"mrr_at_3": 0.32152,
|
17 |
+
"mrr_at_5": 0.33355,
|
18 |
+
"ndcg_at_1": 0.27239,
|
19 |
+
"ndcg_at_10": 0.35324,
|
20 |
+
"ndcg_at_100": 0.40866,
|
21 |
+
"ndcg_at_1000": 0.43584,
|
22 |
+
"ndcg_at_3": 0.30899,
|
23 |
+
"ndcg_at_5": 0.32813,
|
24 |
+
"precision_at_1": 0.27239,
|
25 |
+
"precision_at_10": 0.05896,
|
26 |
+
"precision_at_100": 0.00979,
|
27 |
+
"precision_at_1000": 0.00133,
|
28 |
+
"precision_at_3": 0.13713,
|
29 |
+
"precision_at_5": 0.09683,
|
30 |
+
"recall_at_1": 0.23286,
|
31 |
+
"recall_at_10": 0.45711,
|
32 |
+
"recall_at_100": 0.70611,
|
33 |
+
"recall_at_1000": 0.90029,
|
34 |
+
"recall_at_3": 0.33615,
|
35 |
+
"recall_at_5": 0.3841
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackWebmastersRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1047.0,
|
6 |
+
"map_at_1": 0.23962,
|
7 |
+
"map_at_10": 0.31943,
|
8 |
+
"map_at_100": 0.33384,
|
9 |
+
"map_at_1000": 0.33611,
|
10 |
+
"map_at_3": 0.29243,
|
11 |
+
"map_at_5": 0.30446,
|
12 |
+
"mrr_at_1": 0.28458,
|
13 |
+
"mrr_at_10": 0.36157,
|
14 |
+
"mrr_at_100": 0.37093,
|
15 |
+
"mrr_at_1000": 0.37163,
|
16 |
+
"mrr_at_3": 0.3386,
|
17 |
+
"mrr_at_5": 0.35086,
|
18 |
+
"ndcg_at_1": 0.28458,
|
19 |
+
"ndcg_at_10": 0.37201,
|
20 |
+
"ndcg_at_100": 0.42591,
|
21 |
+
"ndcg_at_1000": 0.45539,
|
22 |
+
"ndcg_at_3": 0.32889,
|
23 |
+
"ndcg_at_5": 0.34483,
|
24 |
+
"precision_at_1": 0.28458,
|
25 |
+
"precision_at_10": 0.07332,
|
26 |
+
"precision_at_100": 0.01437,
|
27 |
+
"precision_at_1000": 0.00233,
|
28 |
+
"precision_at_3": 0.15547,
|
29 |
+
"precision_at_5": 0.11146,
|
30 |
+
"recall_at_1": 0.23962,
|
31 |
+
"recall_at_10": 0.46751,
|
32 |
+
"recall_at_100": 0.71626,
|
33 |
+
"recall_at_1000": 0.90939,
|
34 |
+
"recall_at_3": 0.34138,
|
35 |
+
"recall_at_5": 0.38673
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/CQADupstackWordpressRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3522.66,
|
6 |
+
"map_at_1": 0.18555,
|
7 |
+
"map_at_10": 0.24759,
|
8 |
+
"map_at_100": 0.25732,
|
9 |
+
"map_at_1000": 0.25847,
|
10 |
+
"map_at_3": 0.22646,
|
11 |
+
"map_at_5": 0.23792,
|
12 |
+
"mrr_at_1": 0.20148,
|
13 |
+
"mrr_at_10": 0.26696,
|
14 |
+
"mrr_at_100": 0.27605,
|
15 |
+
"mrr_at_1000": 0.27696,
|
16 |
+
"mrr_at_3": 0.24522,
|
17 |
+
"mrr_at_5": 0.25715,
|
18 |
+
"ndcg_at_1": 0.20148,
|
19 |
+
"ndcg_at_10": 0.28746,
|
20 |
+
"ndcg_at_100": 0.3357,
|
21 |
+
"ndcg_at_1000": 0.36584,
|
22 |
+
"ndcg_at_3": 0.24532,
|
23 |
+
"ndcg_at_5": 0.26484,
|
24 |
+
"precision_at_1": 0.20148,
|
25 |
+
"precision_at_10": 0.04529,
|
26 |
+
"precision_at_100": 0.00736,
|
27 |
+
"precision_at_1000": 0.00108,
|
28 |
+
"precision_at_3": 0.10351,
|
29 |
+
"precision_at_5": 0.0732,
|
30 |
+
"recall_at_1": 0.18555,
|
31 |
+
"recall_at_10": 0.39276,
|
32 |
+
"recall_at_100": 0.61511,
|
33 |
+
"recall_at_1000": 0.84111,
|
34 |
+
"recall_at_3": 0.27779,
|
35 |
+
"recall_at_5": 0.32591
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ClimateFEVER.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 30738.76,
|
6 |
+
"map_at_1": 0.10367,
|
7 |
+
"map_at_10": 0.18954,
|
8 |
+
"map_at_100": 0.20675,
|
9 |
+
"map_at_1000": 0.20868,
|
10 |
+
"map_at_3": 0.15486,
|
11 |
+
"map_at_5": 0.17347,
|
12 |
+
"mrr_at_1": 0.23257,
|
13 |
+
"mrr_at_10": 0.35419,
|
14 |
+
"mrr_at_100": 0.36361,
|
15 |
+
"mrr_at_1000": 0.36403,
|
16 |
+
"mrr_at_3": 0.31748,
|
17 |
+
"mrr_at_5": 0.34077,
|
18 |
+
"ndcg_at_1": 0.23257,
|
19 |
+
"ndcg_at_10": 0.2711,
|
20 |
+
"ndcg_at_100": 0.33981,
|
21 |
+
"ndcg_at_1000": 0.37444,
|
22 |
+
"ndcg_at_3": 0.21472,
|
23 |
+
"ndcg_at_5": 0.23769,
|
24 |
+
"precision_at_1": 0.23257,
|
25 |
+
"precision_at_10": 0.08704,
|
26 |
+
"precision_at_100": 0.01606,
|
27 |
+
"precision_at_1000": 0.00225,
|
28 |
+
"precision_at_3": 0.16287,
|
29 |
+
"precision_at_5": 0.13068,
|
30 |
+
"recall_at_1": 0.10367,
|
31 |
+
"recall_at_10": 0.33706,
|
32 |
+
"recall_at_100": 0.57375,
|
33 |
+
"recall_at_1000": 0.7679,
|
34 |
+
"recall_at_3": 0.2018,
|
35 |
+
"recall_at_5": 0.26215
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/DBPedia.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 21716.72,
|
6 |
+
"map_at_1": 0.08246,
|
7 |
+
"map_at_10": 0.15979,
|
8 |
+
"map_at_100": 0.21025,
|
9 |
+
"map_at_1000": 0.2219,
|
10 |
+
"map_at_3": 0.11997,
|
11 |
+
"map_at_5": 0.13697,
|
12 |
+
"mrr_at_1": 0.6075,
|
13 |
+
"mrr_at_10": 0.68701,
|
14 |
+
"mrr_at_100": 0.691,
|
15 |
+
"mrr_at_1000": 0.69111,
|
16 |
+
"mrr_at_3": 0.66583,
|
17 |
+
"mrr_at_5": 0.67871,
|
18 |
+
"ndcg_at_1": 0.4975,
|
19 |
+
"ndcg_at_10": 0.34702,
|
20 |
+
"ndcg_at_100": 0.37607,
|
21 |
+
"ndcg_at_1000": 0.44322,
|
22 |
+
"ndcg_at_3": 0.39555,
|
23 |
+
"ndcg_at_5": 0.36684,
|
24 |
+
"precision_at_1": 0.6075,
|
25 |
+
"precision_at_10": 0.26625,
|
26 |
+
"precision_at_100": 0.0797,
|
27 |
+
"precision_at_1000": 0.01678,
|
28 |
+
"precision_at_3": 0.41833,
|
29 |
+
"precision_at_5": 0.345,
|
30 |
+
"recall_at_1": 0.08246,
|
31 |
+
"recall_at_10": 0.20968,
|
32 |
+
"recall_at_100": 0.42065,
|
33 |
+
"recall_at_1000": 0.63671,
|
34 |
+
"recall_at_3": 0.13039,
|
35 |
+
"recall_at_5": 0.16042
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/EmotionClassification.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.49215,
|
6 |
+
"accuracy_stderr": 0.0188680285138644,
|
7 |
+
"evaluation_time": 46.17,
|
8 |
+
"f1": 0.44859524511637555,
|
9 |
+
"f1_stderr": 0.012754862698341127,
|
10 |
+
"main_score": 0.49215
|
11 |
+
}
|
12 |
+
}
|
evaluation/mteb/FEVER.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 32873.8,
|
6 |
+
"map_at_1": 0.56769,
|
7 |
+
"map_at_10": 0.67302,
|
8 |
+
"map_at_100": 0.67692,
|
9 |
+
"map_at_1000": 0.67712,
|
10 |
+
"map_at_3": 0.65346,
|
11 |
+
"map_at_5": 0.66574,
|
12 |
+
"mrr_at_1": 0.61371,
|
13 |
+
"mrr_at_10": 0.71875,
|
14 |
+
"mrr_at_100": 0.72195,
|
15 |
+
"mrr_at_1000": 0.72206,
|
16 |
+
"mrr_at_3": 0.7004,
|
17 |
+
"mrr_at_5": 0.71224,
|
18 |
+
"ndcg_at_1": 0.61371,
|
19 |
+
"ndcg_at_10": 0.72731,
|
20 |
+
"ndcg_at_100": 0.74468,
|
21 |
+
"ndcg_at_1000": 0.74916,
|
22 |
+
"ndcg_at_3": 0.69077,
|
23 |
+
"ndcg_at_5": 0.71111,
|
24 |
+
"precision_at_1": 0.61371,
|
25 |
+
"precision_at_10": 0.09326,
|
26 |
+
"precision_at_100": 0.0103,
|
27 |
+
"precision_at_1000": 0.00108,
|
28 |
+
"precision_at_3": 0.27303,
|
29 |
+
"precision_at_5": 0.17525,
|
30 |
+
"recall_at_1": 0.56769,
|
31 |
+
"recall_at_10": 0.8506,
|
32 |
+
"recall_at_100": 0.92767,
|
33 |
+
"recall_at_1000": 0.95933,
|
34 |
+
"recall_at_3": 0.75131,
|
35 |
+
"recall_at_5": 0.8017
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/FiQA2018.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 506.29,
|
6 |
+
"map_at_1": 0.15753,
|
7 |
+
"map_at_10": 0.25876,
|
8 |
+
"map_at_100": 0.27415,
|
9 |
+
"map_at_1000": 0.27591,
|
10 |
+
"map_at_3": 0.2217,
|
11 |
+
"map_at_5": 0.24236,
|
12 |
+
"mrr_at_1": 0.31019,
|
13 |
+
"mrr_at_10": 0.39977,
|
14 |
+
"mrr_at_100": 0.40789,
|
15 |
+
"mrr_at_1000": 0.40832,
|
16 |
+
"mrr_at_3": 0.37088,
|
17 |
+
"mrr_at_5": 0.38655,
|
18 |
+
"ndcg_at_1": 0.31019,
|
19 |
+
"ndcg_at_10": 0.33286,
|
20 |
+
"ndcg_at_100": 0.39529,
|
21 |
+
"ndcg_at_1000": 0.42934,
|
22 |
+
"ndcg_at_3": 0.2929,
|
23 |
+
"ndcg_at_5": 0.30615,
|
24 |
+
"precision_at_1": 0.31019,
|
25 |
+
"precision_at_10": 0.09383,
|
26 |
+
"precision_at_100": 0.01602,
|
27 |
+
"precision_at_1000": 0.00222,
|
28 |
+
"precision_at_3": 0.19753,
|
29 |
+
"precision_at_5": 0.14815,
|
30 |
+
"recall_at_1": 0.15753,
|
31 |
+
"recall_at_10": 0.40896,
|
32 |
+
"recall_at_100": 0.64443,
|
33 |
+
"recall_at_1000": 0.85218,
|
34 |
+
"recall_at_3": 0.26526,
|
35 |
+
"recall_at_5": 0.32453
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/HotpotQA.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 24496.84,
|
6 |
+
"map_at_1": 0.32154,
|
7 |
+
"map_at_10": 0.43651,
|
8 |
+
"map_at_100": 0.4441,
|
9 |
+
"map_at_1000": 0.44487,
|
10 |
+
"map_at_3": 0.41239,
|
11 |
+
"map_at_5": 0.42659,
|
12 |
+
"mrr_at_1": 0.64308,
|
13 |
+
"mrr_at_10": 0.71225,
|
14 |
+
"mrr_at_100": 0.7157,
|
15 |
+
"mrr_at_1000": 0.71591,
|
16 |
+
"mrr_at_3": 0.6995,
|
17 |
+
"mrr_at_5": 0.70738,
|
18 |
+
"ndcg_at_1": 0.64308,
|
19 |
+
"ndcg_at_10": 0.52835,
|
20 |
+
"ndcg_at_100": 0.55841,
|
21 |
+
"ndcg_at_1000": 0.57484,
|
22 |
+
"ndcg_at_3": 0.49014,
|
23 |
+
"ndcg_at_5": 0.51016,
|
24 |
+
"precision_at_1": 0.64308,
|
25 |
+
"precision_at_10": 0.1077,
|
26 |
+
"precision_at_100": 0.01315,
|
27 |
+
"precision_at_1000": 0.00153,
|
28 |
+
"precision_at_3": 0.30223,
|
29 |
+
"precision_at_5": 0.19716,
|
30 |
+
"recall_at_1": 0.32154,
|
31 |
+
"recall_at_10": 0.53849,
|
32 |
+
"recall_at_100": 0.6576,
|
33 |
+
"recall_at_1000": 0.76705,
|
34 |
+
"recall_at_3": 0.45334,
|
35 |
+
"recall_at_5": 0.49291
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/ImdbClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"accuracy": 0.635316,
|
6 |
+
"accuracy_stderr": 0.04211004041793359,
|
7 |
+
"ap": 0.5890084300359825,
|
8 |
+
"ap_stderr": 0.03111656030669087,
|
9 |
+
"evaluation_time": 1823.15,
|
10 |
+
"f1": 0.6335727889030892,
|
11 |
+
"f1_stderr": 0.04298181731027657,
|
12 |
+
"main_score": 0.635316
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MSMARCO.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"validation": {
|
5 |
+
"evaluation_time": 43129.71,
|
6 |
+
"map_at_1": 0.20566,
|
7 |
+
"map_at_10": 0.32229,
|
8 |
+
"map_at_100": 0.33445,
|
9 |
+
"map_at_1000": 0.33501,
|
10 |
+
"map_at_3": 0.28504,
|
11 |
+
"map_at_5": 0.30681,
|
12 |
+
"mrr_at_1": 0.21218,
|
13 |
+
"mrr_at_10": 0.32816,
|
14 |
+
"mrr_at_100": 0.33986,
|
15 |
+
"mrr_at_1000": 0.34035,
|
16 |
+
"mrr_at_3": 0.2915,
|
17 |
+
"mrr_at_5": 0.3129,
|
18 |
+
"ndcg_at_1": 0.21218,
|
19 |
+
"ndcg_at_10": 0.38832,
|
20 |
+
"ndcg_at_100": 0.44743,
|
21 |
+
"ndcg_at_1000": 0.46138,
|
22 |
+
"ndcg_at_3": 0.31232,
|
23 |
+
"ndcg_at_5": 0.351,
|
24 |
+
"precision_at_1": 0.21218,
|
25 |
+
"precision_at_10": 0.06186,
|
26 |
+
"precision_at_100": 0.00914,
|
27 |
+
"precision_at_1000": 0.00103,
|
28 |
+
"precision_at_3": 0.13314,
|
29 |
+
"precision_at_5": 0.09943,
|
30 |
+
"recall_at_1": 0.20566,
|
31 |
+
"recall_at_10": 0.59192,
|
32 |
+
"recall_at_100": 0.86626,
|
33 |
+
"recall_at_1000": 0.97283,
|
34 |
+
"recall_at_3": 0.38492,
|
35 |
+
"recall_at_5": 0.4776
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/MTOPDomainClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.9256269949840401,
|
7 |
+
"accuracy_stderr": 0.0038850782151341893,
|
8 |
+
"f1": 0.921020975473988,
|
9 |
+
"f1_stderr": 0.0044060167819252195,
|
10 |
+
"main_score": 0.9256269949840401
|
11 |
+
},
|
12 |
+
"evaluation_time": 45.61
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MTOPIntentClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.7184678522571819,
|
7 |
+
"accuracy_stderr": 0.01111163093063421,
|
8 |
+
"f1": 0.5365271934859202,
|
9 |
+
"f1_stderr": 0.010588821247395342,
|
10 |
+
"main_score": 0.7184678522571819
|
11 |
+
},
|
12 |
+
"evaluation_time": 122.63
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MassiveIntentClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.6900806993947546,
|
7 |
+
"accuracy_stderr": 0.012602822825246073,
|
8 |
+
"f1": 0.6741429618885515,
|
9 |
+
"f1_stderr": 0.011707310656187842,
|
10 |
+
"main_score": 0.6900806993947546
|
11 |
+
},
|
12 |
+
"evaluation_time": 72.53
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MassiveScenarioClassification.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"en": {
|
6 |
+
"accuracy": 0.7590114324142568,
|
7 |
+
"accuracy_stderr": 0.010656499030857346,
|
8 |
+
"f1": 0.7625183590651454,
|
9 |
+
"f1_stderr": 0.010649247943952904,
|
10 |
+
"main_score": 0.7590114324142568
|
11 |
+
},
|
12 |
+
"evaluation_time": 41.51
|
13 |
+
}
|
14 |
+
}
|
evaluation/mteb/MedrxivClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 3336.04,
|
6 |
+
"v_measure": 0.31350109978273394,
|
7 |
+
"v_measure_std": 0.015425381126297112
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/MedrxivClusteringS2S.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 492.85,
|
6 |
+
"v_measure": 0.2876892369576733,
|
7 |
+
"v_measure_std": 0.01586647571955603
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/NFCorpus.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 168.77,
|
6 |
+
"map_at_1": 0.05604,
|
7 |
+
"map_at_10": 0.1238,
|
8 |
+
"map_at_100": 0.15791,
|
9 |
+
"map_at_1000": 0.17327,
|
10 |
+
"map_at_3": 0.0915,
|
11 |
+
"map_at_5": 0.10599,
|
12 |
+
"mrr_at_1": 0.45201,
|
13 |
+
"mrr_at_10": 0.53374,
|
14 |
+
"mrr_at_100": 0.54089,
|
15 |
+
"mrr_at_1000": 0.54123,
|
16 |
+
"mrr_at_3": 0.51445,
|
17 |
+
"mrr_at_5": 0.5259,
|
18 |
+
"ndcg_at_1": 0.42879,
|
19 |
+
"ndcg_at_10": 0.33891,
|
20 |
+
"ndcg_at_100": 0.31392,
|
21 |
+
"ndcg_at_1000": 0.4036,
|
22 |
+
"ndcg_at_3": 0.39076,
|
23 |
+
"ndcg_at_5": 0.37047,
|
24 |
+
"precision_at_1": 0.44582,
|
25 |
+
"precision_at_10": 0.25294,
|
26 |
+
"precision_at_100": 0.08285,
|
27 |
+
"precision_at_1000": 0.02148,
|
28 |
+
"precision_at_3": 0.3612,
|
29 |
+
"precision_at_5": 0.3195,
|
30 |
+
"recall_at_1": 0.05604,
|
31 |
+
"recall_at_10": 0.16239,
|
32 |
+
"recall_at_100": 0.3216,
|
33 |
+
"recall_at_1000": 0.64513,
|
34 |
+
"recall_at_3": 0.10406,
|
35 |
+
"recall_at_5": 0.12685
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/NQ.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 15471.98,
|
6 |
+
"map_at_1": 0.25881,
|
7 |
+
"map_at_10": 0.39501,
|
8 |
+
"map_at_100": 0.40615,
|
9 |
+
"map_at_1000": 0.40661,
|
10 |
+
"map_at_3": 0.35559,
|
11 |
+
"map_at_5": 0.37773,
|
12 |
+
"mrr_at_1": 0.29229,
|
13 |
+
"mrr_at_10": 0.41956,
|
14 |
+
"mrr_at_100": 0.4286,
|
15 |
+
"mrr_at_1000": 0.42893,
|
16 |
+
"mrr_at_3": 0.38562,
|
17 |
+
"mrr_at_5": 0.40542,
|
18 |
+
"ndcg_at_1": 0.292,
|
19 |
+
"ndcg_at_10": 0.46703,
|
20 |
+
"ndcg_at_100": 0.51644,
|
21 |
+
"ndcg_at_1000": 0.52771,
|
22 |
+
"ndcg_at_3": 0.39142,
|
23 |
+
"ndcg_at_5": 0.42892,
|
24 |
+
"precision_at_1": 0.292,
|
25 |
+
"precision_at_10": 0.0792,
|
26 |
+
"precision_at_100": 0.01066,
|
27 |
+
"precision_at_1000": 0.00117,
|
28 |
+
"precision_at_3": 0.18105,
|
29 |
+
"precision_at_5": 0.13036,
|
30 |
+
"recall_at_1": 0.25881,
|
31 |
+
"recall_at_10": 0.66266,
|
32 |
+
"recall_at_100": 0.88116,
|
33 |
+
"recall_at_1000": 0.96582,
|
34 |
+
"recall_at_3": 0.46526,
|
35 |
+
"recall_at_5": 0.55154
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/QuoraRetrieval.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 1285.77,
|
6 |
+
"map_at_1": 0.67553,
|
7 |
+
"map_at_10": 0.8134,
|
8 |
+
"map_at_100": 0.82002,
|
9 |
+
"map_at_1000": 0.82027,
|
10 |
+
"map_at_3": 0.78281,
|
11 |
+
"map_at_5": 0.80149,
|
12 |
+
"mrr_at_1": 0.7772,
|
13 |
+
"mrr_at_10": 0.84733,
|
14 |
+
"mrr_at_100": 0.84878,
|
15 |
+
"mrr_at_1000": 0.84879,
|
16 |
+
"mrr_at_3": 0.83587,
|
17 |
+
"mrr_at_5": 0.84326,
|
18 |
+
"ndcg_at_1": 0.7775,
|
19 |
+
"ndcg_at_10": 0.85603,
|
20 |
+
"ndcg_at_100": 0.87069,
|
21 |
+
"ndcg_at_1000": 0.8725,
|
22 |
+
"ndcg_at_3": 0.82303,
|
23 |
+
"ndcg_at_5": 0.84037,
|
24 |
+
"precision_at_1": 0.7775,
|
25 |
+
"precision_at_10": 0.1304,
|
26 |
+
"precision_at_100": 0.01507,
|
27 |
+
"precision_at_1000": 0.00156,
|
28 |
+
"precision_at_3": 0.35903,
|
29 |
+
"precision_at_5": 0.23738,
|
30 |
+
"recall_at_1": 0.67553,
|
31 |
+
"recall_at_10": 0.93903,
|
32 |
+
"recall_at_100": 0.99062,
|
33 |
+
"recall_at_1000": 0.99935,
|
34 |
+
"recall_at_3": 0.84581,
|
35 |
+
"recall_at_5": 0.89316
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/RedditClustering.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 6540.34,
|
6 |
+
"v_measure": 0.46468877112302354,
|
7 |
+
"v_measure_std": 0.059743532887098036
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/RedditClusteringP2P.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 26567.79,
|
6 |
+
"v_measure": 0.5416687629824692,
|
7 |
+
"v_measure_std": 0.11955619105267504
|
8 |
+
}
|
9 |
+
}
|
evaluation/mteb/SCIDOCS.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"evaluation_time": 338.56,
|
6 |
+
"map_at_1": 0.04053,
|
7 |
+
"map_at_10": 0.09694,
|
8 |
+
"map_at_100": 0.11387,
|
9 |
+
"map_at_1000": 0.11654,
|
10 |
+
"map_at_3": 0.07053,
|
11 |
+
"map_at_5": 0.08439,
|
12 |
+
"mrr_at_1": 0.199,
|
13 |
+
"mrr_at_10": 0.29359,
|
14 |
+
"mrr_at_100": 0.30484,
|
15 |
+
"mrr_at_1000": 0.30553,
|
16 |
+
"mrr_at_3": 0.262,
|
17 |
+
"mrr_at_5": 0.28115,
|
18 |
+
"ndcg_at_1": 0.199,
|
19 |
+
"ndcg_at_10": 0.16575,
|
20 |
+
"ndcg_at_100": 0.23655,
|
21 |
+
"ndcg_at_1000": 0.28853,
|
22 |
+
"ndcg_at_3": 0.15848,
|
23 |
+
"ndcg_at_5": 0.14026,
|
24 |
+
"precision_at_1": 0.199,
|
25 |
+
"precision_at_10": 0.0845,
|
26 |
+
"precision_at_100": 0.01872,
|
27 |
+
"precision_at_1000": 0.00313,
|
28 |
+
"precision_at_3": 0.14667,
|
29 |
+
"precision_at_5": 0.1232,
|
30 |
+
"recall_at_1": 0.04053,
|
31 |
+
"recall_at_10": 0.1717,
|
32 |
+
"recall_at_100": 0.38025,
|
33 |
+
"recall_at_1000": 0.63572,
|
34 |
+
"recall_at_3": 0.08903,
|
35 |
+
"recall_at_5": 0.12477
|
36 |
+
}
|
37 |
+
}
|
evaluation/mteb/SGPT-2.7B-weightedmean-msmarco-specb-bitfit_results.csv
ADDED
@@ -0,0 +1,354 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model,task,dataset,language,metric,value
|
2 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,BitextMining,BUCC,,f1,
|
3 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,BitextMining,Tatoeba,,f1,
|
4 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en,accuracy,0.6756716417910448
|
5 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
6 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
|
7 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
8 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
|
9 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
10 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
|
11 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonPolarityClassification,en,accuracy,0.71439575
|
12 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,en,accuracy,0.35748
|
13 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
14 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
|
15 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
16 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
|
17 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
18 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
|
19 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
20 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
|
21 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
22 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
|
23 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,Banking77Classification,en,accuracy,0.8321753246753246
|
24 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,EmotionClassification,en,accuracy,0.49215
|
25 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,ImdbClassification,en,accuracy,0.635316
|
26 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
27 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
|
28 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
29 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
|
30 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
31 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
|
32 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
33 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
|
34 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
35 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
|
36 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
37 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
|
38 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
39 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
|
40 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
41 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
|
42 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
43 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
|
44 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,en,accuracy,0.6900806993947546
|
45 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
46 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
|
47 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
48 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
|
49 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
50 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
|
51 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
52 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
|
53 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
54 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
|
55 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
56 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
|
57 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
58 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
|
59 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
60 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
|
61 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
62 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
|
63 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
64 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
|
65 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
66 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
|
67 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
68 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
|
69 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
70 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
|
71 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
72 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
|
73 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
74 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
|
75 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
76 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
|
77 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
78 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
|
79 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
80 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
|
81 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
82 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
|
83 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
84 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
|
85 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
86 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
|
87 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
88 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
|
89 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
90 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
|
91 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
92 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
|
93 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
94 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
|
95 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
96 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
|
97 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
98 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
|
99 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
100 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
|
101 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
102 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
|
103 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
104 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
|
105 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
106 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
|
107 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
108 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
|
109 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
110 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
|
111 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
112 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
|
113 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
114 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
|
115 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
116 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
|
117 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
118 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
|
119 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
120 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
|
121 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
122 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
|
123 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
124 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
|
125 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
126 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
|
127 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
128 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
|
129 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
130 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
|
131 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
132 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
|
133 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
134 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
|
135 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
136 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
|
137 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
138 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
|
139 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
140 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
|
141 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
142 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
|
143 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
144 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
|
145 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,en,accuracy,0.7590114324142568
|
146 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
147 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
|
148 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
149 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
|
150 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
151 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
|
152 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
153 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
|
154 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
155 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
|
156 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
157 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
|
158 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
159 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
|
160 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
161 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
|
162 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
163 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
|
164 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
165 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
|
166 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
167 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
|
168 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
169 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
|
170 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
171 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
|
172 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
173 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
|
174 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
175 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
|
176 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
177 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
|
178 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
179 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
|
180 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
181 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
|
182 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
183 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
|
184 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
185 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
|
186 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
187 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
|
188 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
189 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
|
190 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
191 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
|
192 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
193 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
|
194 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
195 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
|
196 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
197 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
|
198 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
199 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
|
200 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
201 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
|
202 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
203 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
|
204 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
205 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
|
206 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
207 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
|
208 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
209 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
|
210 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
211 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
|
212 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
213 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
|
214 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
215 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
|
216 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
217 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
|
218 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
219 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
|
220 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
221 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
|
222 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
223 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
|
224 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
225 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
|
226 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
227 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
|
228 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,en,accuracy,0.9256269949840401
|
229 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
230 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
|
231 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
232 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
|
233 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
234 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
|
235 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
236 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
|
237 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
238 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
|
239 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,en,accuracy,0.7184678522571819
|
240 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
241 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
|
242 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
243 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
|
244 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
245 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
|
246 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
247 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
|
248 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
249 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
|
250 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,ToxicConversationsClassification,en,accuracy,0.6884080000000001
|
251 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,TweetSentimentExtractionClassification,en,accuracy,0.5668647425014148
|
252 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringP2P,en,v_measure,0.44721257146422017
|
253 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringS2S,en,v_measure,0.35081451519142065
|
254 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringP2P,en,v_measure,0.3441414219680629
|
255 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringS2S,en,v_measure,0.30533275862270026
|
256 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringP2P,en,v_measure,0.31350109978273394
|
257 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringS2S,en,v_measure,0.2876892369576733
|
258 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClustering,en,v_measure,0.46468877112302354
|
259 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClusteringP2P,en,v_measure,0.5416687629824692
|
260 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClustering,en,v_measure,0.5919409867397648
|
261 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClusteringP2P,en,v_measure,0.32574403257811496
|
262 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,TwentyNewsgroupsClustering,en,v_measure,0.408911707239219
|
263 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,SprintDuplicateQuestions,en,ap,0.9347124923047998
|
264 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterSemEval2015,en,ap,0.6368133990830133
|
265 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterURLCorpus,en,ap,0.8480240716354543
|
266 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,AskUbuntuDupQuestions,en,map,0.5963466199039206
|
267 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,MindSmallReranking,,map,
|
268 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,SciDocsRR,en,map,0.7771580844366375
|
269 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,StackOverflowDupQuestions,en,map,0.4961186384154483
|
270 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,ArguAna,en,ndcg_at_10,0.50491
|
271 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,ClimateFEVER,en,ndcg_at_10,0.2711
|
272 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,CQADupstackRetrieval,en,ndcg_at_10,0.3653358333333333
|
273 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,DBPedia,en,ndcg_at_10,0.34702
|
274 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,FEVER,en,ndcg_at_10,0.72731
|
275 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,FiQA2018,en,ndcg_at_10,0.33286
|
276 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,HotpotQA,en,ndcg_at_10,0.52835
|
277 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,MSMARCO,en,ndcg_at_10,0.38832
|
278 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,NFCorpus,en,ndcg_at_10,0.33891
|
279 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,NQ,en,ndcg_at_10,0.46703
|
280 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,QuoraRetrieval,en,ndcg_at_10,0.85603
|
281 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,SCIDOCS,en,ndcg_at_10,0.16575
|
282 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,SciFact,en,ndcg_at_10,0.70165
|
283 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,Touche2020,en,ndcg_at_10,0.2344
|
284 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,TRECCOVID,en,ndcg_at_10,0.7517
|
285 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,BIOSSES,en,cosine_spearman,0.8484289705838665
|
286 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,SICK-R,en,cosine_spearman,0.6819926431966059
|
287 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS12,en,cosine_spearman,0.6699390786191646
|
288 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS13,en,cosine_spearman,0.7757623085766706
|
289 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS14,en,cosine_spearman,0.7278258293483495
|
290 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS15,en,cosine_spearman,0.8261707296911949
|
291 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS16,en,cosine_spearman,0.8009839524406284
|
292 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
293 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
|
294 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
295 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
|
296 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
297 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
|
298 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
299 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
|
300 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-en,cosine_spearman,0.8725017540413703
|
301 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
302 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
|
303 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
304 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
|
305 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
306 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
|
307 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
308 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
|
309 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
310 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
|
311 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
312 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
|
313 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,en,cosine_spearman,0.687486910762485
|
314 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
315 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
|
316 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
317 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
|
318 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
319 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
|
320 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
321 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
|
322 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
323 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
|
324 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
325 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
|
326 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
327 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
|
328 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
329 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
|
330 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
331 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
|
332 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
333 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
|
334 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
335 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
|
336 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
337 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
|
338 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
339 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
|
340 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
341 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
|
342 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
343 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
|
344 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
345 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
|
346 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
347 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
|
348 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STSBenchmark,en,cosine_spearman,0.7920585637461047
|
349 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Summarization,SummEval,en,cosine_spearman,0.27870478281195465
|
350 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,average,en,accuracy,0.6713040365015015
|
351 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,average,en,v_measure,0.39833144224085476
|
352 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,average,en,ap,0.8065166543410891
|
353 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,average,en,ndcg_at_10,0.4653783888888888
|
354 |
+
SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,average,en,cosine_spearman,0.768315074100644
|
evaluation/mteb/SICK-R.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7775487485196769,
|
7 |
+
"spearman": 0.6819926431966059
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7169016204991725,
|
11 |
+
"spearman": 0.6698099673026834
|
12 |
+
},
|
13 |
+
"evaluation_time": 106.65,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7162994072488664,
|
16 |
+
"spearman": 0.6703435950744577
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/STS12.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7591051402657887,
|
7 |
+
"spearman": 0.6699390786191646
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7154128036454578,
|
11 |
+
"spearman": 0.6925605675649068
|
12 |
+
},
|
13 |
+
"evaluation_time": 49.4,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7160981030780171,
|
16 |
+
"spearman": 0.6927513670128046
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/STS13.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7723835466417793,
|
7 |
+
"spearman": 0.7757623085766706
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.775090992200725,
|
11 |
+
"spearman": 0.7788601688144924
|
12 |
+
},
|
13 |
+
"evaluation_time": 21.2,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7739045060647423,
|
16 |
+
"spearman": 0.7777552718279098
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|
evaluation/mteb/STS14.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"dataset_version": null,
|
3 |
+
"mteb_version": "0.0.2",
|
4 |
+
"test": {
|
5 |
+
"cos_sim": {
|
6 |
+
"pearson": 0.7791692485139602,
|
7 |
+
"spearman": 0.7278258293483495
|
8 |
+
},
|
9 |
+
"euclidean": {
|
10 |
+
"pearson": 0.7464773017077789,
|
11 |
+
"spearman": 0.7181662299104619
|
12 |
+
},
|
13 |
+
"evaluation_time": 52.55,
|
14 |
+
"manhattan": {
|
15 |
+
"pearson": 0.7471043337995533,
|
16 |
+
"spearman": 0.7183960860845646
|
17 |
+
}
|
18 |
+
}
|
19 |
+
}
|