diff --git a/mteb/abstasks/AbsTaskClusteringFast.py b/mteb/abstasks/AbsTaskClusteringFast.py index a5142f3081..eb85b38ceb 100644 --- a/mteb/abstasks/AbsTaskClusteringFast.py +++ b/mteb/abstasks/AbsTaskClusteringFast.py @@ -82,7 +82,13 @@ class AbsTaskClusteringFast(AbsTask): The similarity then is calculated using the V-measure metric, which is invariant to the permutation of the labels. This approach is then repeated K times. - If the clustering is hieararchical, and more than one label is specified in order for each observation, + There are two ways to specify how a dataset is downsampled: + - max_document_to_embed (int): defaults to None + - max_fraction_of_documents_to_embed (float): defaults to 4%. + If both parameters are set to None, no downsampling is done in self._evaluate_subset(). + At most one of these two parameters may be set (not None) at the same time. + + If the clustering is hierarchical, and more than one label is specified in order for each observation, V-measures are calculated in the outlined way on each of the levels separately. self.load_data() must generate a huggingface dataset with a split matching self.metadata_dict["eval_splits"], and assign it to self.dataset. 
@@ -91,8 +97,9 @@ class AbsTaskClusteringFast(AbsTask): labels: list[str] | list[list[str]] """ - max_documents_to_embed = 16_384 - max_documents_per_cluster = 2048 + max_fraction_of_documents_to_embed = 0.04 + max_document_to_embed = None + max_documents_per_cluster = 16_384 n_clusters = 10 k_mean_batch_size = 512 max_depth = None @@ -113,13 +120,29 @@ def _evaluate_subset( ) -> dict[str, float | dict[str, list[float]]]: rng_state = random.Random(self.seed) - if len(dataset) > self.max_documents_to_embed: - example_indices = rng_state.sample( - range(len(dataset)), k=self.max_documents_to_embed + if ( + self.max_document_to_embed is not None + and self.max_fraction_of_documents_to_embed is not None + ): + raise Exception( + "Both max_document_to_embed and max_fraction_of_documents_to_embed are set. Please only set one." ) - downsampled_dataset = dataset.select(example_indices) # type: ignore - else: + + if ( + self.max_document_to_embed is None + and self.max_fraction_of_documents_to_embed is None + ): downsampled_dataset = dataset + else: + max_documents_to_embed = self.max_document_to_embed + if self.max_fraction_of_documents_to_embed is not None: + max_documents_to_embed = int( + self.max_fraction_of_documents_to_embed * len(dataset) + ) + example_indices = rng_state.sample( + range(len(dataset)), k=max_documents_to_embed + ) + downsampled_dataset = dataset.select(example_indices) embeddings = model_encode( downsampled_dataset["sentences"], # type: ignore @@ -133,7 +156,7 @@ def _evaluate_subset( label = [label] labels.append(label) - v_measures = evaluate_clustering_bootstrapped( + all_v_scores = evaluate_clustering_bootstrapped( embeddings, labels, n_clusters=self.n_clusters, @@ -142,9 +165,15 @@ def _evaluate_subset( max_depth=self.max_depth, rng_state=rng_state, ) - all_v_scores = itertools.chain.from_iterable(v_measures.values()) - mean_v_measure = np.mean(list(all_v_scores)) - scores = {"v_measures": v_measures, "v_measure": float(mean_v_measure)} + 
v_measures = list(itertools.chain.from_iterable(all_v_scores.values())) + + mean_v_measure = np.mean(v_measures) + v_std = np.std(v_measures) + scores = { + "v_measures": all_v_scores, + "v_measure": float(mean_v_measure), + "v_measure_std": v_std, + } self._add_main_score(scores) return scores diff --git a/mteb/cli.py b/mteb/cli.py index 56efbe7176..5ce6a6464f 100644 --- a/mteb/cli.py +++ b/mteb/cli.py @@ -198,8 +198,8 @@ def add_run_parser(subparsers) -> None: parser.add_argument( "--output_folder", type=str, - default=None, - help="Output directory for results. Will default to results/{model_name} if not set.", + default="results", + help="Output directory for results. Will default to `results` if not set.", ) parser.add_argument( "-v", "--verbosity", type=int, default=2, help="Verbosity level" diff --git a/mteb/model_meta.py b/mteb/model_meta.py index 335d6476f7..664cd60206 100644 --- a/mteb/model_meta.py +++ b/mteb/model_meta.py @@ -77,7 +77,7 @@ class ModelMeta(BaseModel): def to_dict(self): dict_repr = self.model_dump() loader = dict_repr.pop("loader", None) - dict_repr["loader"] = get_loader_name(loader) + dict_repr["loader"] = loader.func.__name__ if loader is not None else None return dict_repr def load_model(self, **kwargs: Any) -> Encoder | EncoderWithQueryCorpusEncode: diff --git a/mteb/models/__init__.py b/mteb/models/__init__.py index 51e4ef8000..19f3dbc38b 100644 --- a/mteb/models/__init__.py +++ b/mteb/models/__init__.py @@ -8,9 +8,11 @@ from mteb.encoder_interface import Encoder, EncoderWithQueryCorpusEncode from mteb.model_meta import ModelMeta from mteb.models import ( + bge_models, e5_instruct, e5_models, gritlm, + mxbai_models, openai_models, sentence_transformers_models, voyage_models, @@ -55,8 +57,10 @@ def get_model_meta(model_name: str, revision: str | None = None) -> ModelMeta: A model metadata object """ if model_name in models: - if revision and (not models[model_name].revision == revision): - raise ValueError(f"Model {revision} not 
found for model {model_name}") + if not models[model_name].revision == revision: + raise ValueError( + f"Model revision {revision} not found for model {model_name}" + ) return models[model_name] else: # assume it is a sentence-transformers model logger.info( @@ -65,7 +69,9 @@ def get_model_meta(model_name: str, revision: str | None = None) -> ModelMeta: logger.info( f"Attempting to extract metadata by loading the model ({model_name}) using sentence-transformers." ) - model = SentenceTransformer(model_name, revision=revision) + model = SentenceTransformer( + model_name, revision=revision, trust_remote_code=True + ) meta = model_meta_from_sentence_transformers(model) meta.revision = revision @@ -108,11 +114,13 @@ def model_meta_from_sentence_transformers(model: SentenceTransformer) -> ModelMe model_modules = [ e5_models, - e5_instruct, gritlm, - openai_models, + e5_instruct, sentence_transformers_models, + openai_models, voyage_models, + bge_models, + mxbai_models, ] models = {} diff --git a/mteb/models/bge_models.py b/mteb/models/bge_models.py new file mode 100644 index 0000000000..42015759ff --- /dev/null +++ b/mteb/models/bge_models.py @@ -0,0 +1,58 @@ +from __future__ import annotations + +from functools import partial +from typing import Any + +import torch +from sentence_transformers import SentenceTransformer + +from mteb.model_meta import ModelMeta +from mteb.models.text_formatting_utils import corpus_to_texts + + +class BGEWrapper: + """following the hf model card documentation.""" + + def __init__(self, model_name: str, **kwargs: Any): + self.model_name = model_name + self.mdl = SentenceTransformer(model_name) + + def to(self, device: torch.device) -> None: + self.mdl.to(device) + + def encode( # type: ignore + self, + sentences: list[str], + *, + batch_size: int = 32, + **kwargs: Any, + ): + return self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + + def encode_queries(self, queries: list[str], batch_size: int = 32, **kwargs: Any): + sentences = 
[ + "Represent this sentence for searching relevant passages: " + sentence + for sentence in queries + ] + emb = self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + return emb + + def encode_corpus( + self, + corpus: list[dict[str, str]] | dict[str, list[str]], + batch_size: int = 32, + **kwargs: Any, + ): + sentences = corpus_to_texts(corpus) + emb = self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + return emb + + +bge_base_en_v1_5 = ModelMeta( + loader=partial(BGEWrapper, model_name="BAAI/bge-base-en-v1.5"), # type: ignore + name="BAAI/bge-base-en-v1.5", + languages=["eng_Latn"], + open_source=True, + revision="a5beb1e3e68b9ab74eb54cfd186867f64f240e1a", + release_date="2023-09-11", # initial commit of hf model. +) diff --git a/mteb/models/e5_models.py b/mteb/models/e5_models.py index fec334709c..e95aaf9353 100644 --- a/mteb/models/e5_models.py +++ b/mteb/models/e5_models.py @@ -177,3 +177,39 @@ def encode_corpus( revision="4dc6d853a804b9c8886ede6dda8a073b7dc08a81", release_date=E5_PAPER_RELEASE_DATE, ) + +e5_eng_small_v2 = ModelMeta( + loader=partial(E5Wrapper, model_name="intfloat/e5-small-v2"), # type: ignore + name="intfloat/e5-small-v2", + languages=["eng_Latn"], + open_source=True, + revision="dca8b1a9dae0d4575df2bf423a5edb485a431236", + release_date=E5_PAPER_RELEASE_DATE, +) + +e5_eng_small = ModelMeta( + loader=partial(E5Wrapper, model_name="intfloat/e5-small"), # type: ignore + name="intfloat/e5-small", + languages=["eng_Latn"], + open_source=True, + revision="e272f3049e853b47cb5ca3952268c6662abda68f", + release_date=E5_PAPER_RELEASE_DATE, +) + +e5_eng_base_v2 = ModelMeta( + loader=partial(E5Wrapper, model_name="intfloat/e5-base-v2"), # type: ignore + name="intfloat/e5-base-v2", + languages=["eng_Latn"], + open_source=True, + revision="1c644c92ad3ba1efdad3f1451a637716616a20e8", + release_date=E5_PAPER_RELEASE_DATE, +) + +e5_eng_large_v2 = ModelMeta( + loader=partial(E5Wrapper, model_name="intfloat/e5-large-v2"), # type: ignore + 
name="intfloat/e5-large-v2", + languages=["eng_Latn"], + open_source=True, + revision="b322e09026e4ea05f42beadf4d661fb4e101d311", + release_date=E5_PAPER_RELEASE_DATE, +) diff --git a/mteb/models/mxbai_models.py b/mteb/models/mxbai_models.py new file mode 100644 index 0000000000..4fa83891e5 --- /dev/null +++ b/mteb/models/mxbai_models.py @@ -0,0 +1,58 @@ +from __future__ import annotations + +from functools import partial +from typing import Any + +import torch +from sentence_transformers import SentenceTransformer + +from mteb.model_meta import ModelMeta +from mteb.models.text_formatting_utils import corpus_to_texts + + +class MxbaiWrapper: + """following the hf model card documentation.""" + + def __init__(self, model_name: str, **kwargs: Any): + self.model_name = model_name + self.mdl = SentenceTransformer(model_name) + + def to(self, device: torch.device) -> None: + self.mdl.to(device) + + def encode( # type: ignore + self, + sentences: list[str], + *, + batch_size: int = 32, + **kwargs: Any, + ): + return self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + + def encode_queries(self, queries: list[str], batch_size: int = 32, **kwargs: Any): + sentences = [ + "Represent this sentence for searching relevant passages: " + sentence + for sentence in queries + ] + emb = self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + return emb + + def encode_corpus( + self, + corpus: list[dict[str, str]] | dict[str, list[str]], + batch_size: int = 32, + **kwargs: Any, + ): + sentences = corpus_to_texts(corpus) + emb = self.mdl.encode(sentences, batch_size=batch_size, **kwargs) + return emb + + +mxbai_embed_large_v1 = ModelMeta( + loader=partial(MxbaiWrapper, model_name="mixedbread-ai/mxbai-embed-large-v1"), # type: ignore + name="mixedbread-ai/mxbai-embed-large-v1", + languages=["eng_Latn"], + open_source=True, + revision="990580e27d329c7408b3741ecff85876e128e203", + release_date="2024-03-07", # initial commit of hf model. 
+) diff --git a/mteb/models/sentence_transformers_models.py b/mteb/models/sentence_transformers_models.py index 5af1ff3042..d1fb638be2 100644 --- a/mteb/models/sentence_transformers_models.py +++ b/mteb/models/sentence_transformers_models.py @@ -2,72 +2,90 @@ from mteb.model_meta import ModelMeta +paraphrase_langs = [ + "ara_Arab", + "bul_Cyrl", + "cat_Latn", + "ces_Latn", + "dan_Latn", + "deu_Latn", + "ell_Grek", + "eng_Latn", + "spa_Latn", + "est_Latn", + "fas_Arab", + "fin_Latn", + "fra_Latn", + "fra_Latn", + "glg_Latn", + "guj_Gujr", + "heb_Hebr", + "hin_Deva", + "hrv_Latn", + "hun_Latn", + "hye_Armn", + "ind_Latn", + "ita_Latn", + "jpn_Jpan", + "kat_Geor", + "kor_Hang", + "kur_Arab", + "lit_Latn", + "lav_Latn", + "mkd_Cyrl", + "mon_Cyrl", + "mar_Deva", + "msa_Latn", + "mya_Mymr", + "nob_Latn", + "nld_Latn", + "pol_Latn", + "por_Latn", + "por_Latn", + "ron_Latn", + "rus_Cyrl", + "slk_Latn", + "slv_Latn", + "sqi_Latn", + "srp_Cyrl", + "swe_Latn", + "tha_Thai", + "tur_Latn", + "ukr_Cyrl", + "urd_Arab", + "vie_Latn", + "zho_Hans", + "zho_Hant", +] + all_MiniLM_L6_v2 = ModelMeta( name="sentence-transformers/all-MiniLM-L6-v2", languages=["eng-Latn"], open_source=True, - revision=None, # can be any + revision="8b3219a92973c328a8e22fadcfa821b5dc75636a", # can be any release_date="2021-08-30", ) paraphrase_multilingual_MiniLM_L12_v2 = ModelMeta( name="sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2", - languages=[ - "ara_Arab", - "bul_Cyrl", - "cat_Latn", - "ces_Latn", - "dan_Latn", - "deu_Latn", - "ell_Grek", - "eng_Latn", - "spa_Latn", - "est_Latn", - "fas_Arab", - "fin_Latn", - "fra_Latn", - "fra_Latn", - "glg_Latn", - "guj_Gujr", - "heb_Hebr", - "hin_Deva", - "hrv_Latn", - "hun_Latn", - "hye_Armn", - "ind_Latn", - "ita_Latn", - "jpn_Jpan", - "kat_Geor", - "kor_Hang", - "kur_Arab", - "lit_Latn", - "lav_Latn", - "mkd_Cyrl", - "mon_Cyrl", - "mar_Deva", - "msa_Latn", - "mya_Mymr", - "nob_Latn", - "nld_Latn", - "pol_Latn", - "por_Latn", - "por_Latn", - 
"ron_Latn", - "rus_Cyrl", - "slk_Latn", - "slv_Latn", - "sqi_Latn", - "srp_Cyrl", - "swe_Latn", - "tha_Thai", - "tur_Latn", - "ukr_Cyrl", - "urd_Arab", - "vie_Latn", - "zho_Hans", - "zho_Hant", - ], + languages=paraphrase_langs, + open_source=True, + revision="bf3bf13ab40c3157080a7ab344c831b9ad18b5eb", # can be any + release_date="2019-11-01", # release date of paper +) + +paraphrase_multilingual_mpnet_base_v2 = ModelMeta( + name="sentence-transformers/paraphrase-multilingual-mpnet-base-v2", + languages=paraphrase_langs, + open_source=True, + revision="79f2382ceacceacdf38563d7c5d16b9ff8d725d6", # can be any + release_date="2019-11-01", # release date of paper +) + +labse = ModelMeta( + name="sentence-transformers/LaBSE", + languages=paraphrase_langs, open_source=True, - revision=None, # can be any + revision="e34fab64a3011d2176c99545a93d5cbddc9a91b7", # can be any release_date="2019-11-01", # release date of paper ) diff --git a/mteb/tasks/Clustering/eng/BiorxivClusteringP2P.py b/mteb/tasks/Clustering/eng/BiorxivClusteringP2P.py index fe67db6dd1..b7ea042964 100644 --- a/mteb/tasks/Clustering/eng/BiorxivClusteringP2P.py +++ b/mteb/tasks/Clustering/eng/BiorxivClusteringP2P.py @@ -32,20 +32,13 @@ class BiorxivClusteringP2PFast(AbsTaskClusteringFast): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 2048}, + n_samples={"test": 2151}, avg_character_length={"test": 1664.0}, ) def dataset_transform(self): for split in self.metadata.eval_splits: check_label_distribution(self.dataset[split]) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - label="labels", - n_samples=2048, - ) class BiorxivClusteringP2P(AbsTaskClustering): diff --git a/mteb/tasks/Clustering/eng/BiorxivClusteringS2S.py b/mteb/tasks/Clustering/eng/BiorxivClusteringS2S.py index b5283305db..597771e1a7 100644 --- a/mteb/tasks/Clustering/eng/BiorxivClusteringS2S.py +++ b/mteb/tasks/Clustering/eng/BiorxivClusteringS2S.py @@ 
-32,20 +32,13 @@ class BiorxivClusteringS2SFast(AbsTaskClusteringFast): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 2048}, + n_samples={"test": 2151}, avg_character_length={"test": 101.7}, ) def dataset_transform(self): for split in self.metadata.eval_splits: check_label_distribution(self.dataset[split]) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - label="labels", - n_samples=2048, - ) class BiorxivClusteringS2S(AbsTaskClustering): diff --git a/mteb/tasks/Clustering/eng/MedrxivClusteringP2P.py b/mteb/tasks/Clustering/eng/MedrxivClusteringP2P.py index 3a569bcda5..7f2e89fde6 100644 --- a/mteb/tasks/Clustering/eng/MedrxivClusteringP2P.py +++ b/mteb/tasks/Clustering/eng/MedrxivClusteringP2P.py @@ -1,5 +1,9 @@ from __future__ import annotations +import itertools + +from datasets import Dataset, DatasetDict + from mteb.abstasks.AbsTaskClustering import AbsTaskClustering from mteb.abstasks.AbsTaskClusteringFast import ( AbsTaskClusteringFast, @@ -15,7 +19,7 @@ class MedrxivClusteringP2PFast(AbsTaskClusteringFast): reference="https://api.medrxiv.org/", dataset={ "path": "mteb/medrxiv-clustering-p2p", - "revision": "9894e30672c61db02f10a8593519d84e2b7a1a1c", + "revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", }, type="Clustering", category="p2p", @@ -32,20 +36,20 @@ class MedrxivClusteringP2PFast(AbsTaskClusteringFast): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 2048}, + n_samples={"test": 1500}, avg_character_length={"test": 1984.7}, ) def dataset_transform(self): + ds = dict() for split in self.metadata.eval_splits: + labels = list(itertools.chain.from_iterable(self.dataset[split]["labels"])) + sentences = list( + itertools.chain.from_iterable(self.dataset[split]["sentences"]) + ) check_label_distribution(self.dataset[split]) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - 
label="labels", - n_samples=2048, - ) + ds[split] = Dataset.from_dict({"labels": labels, "sentences": sentences}) + self.dataset = DatasetDict(ds) class MedrxivClusteringP2P(AbsTaskClustering): @@ -73,6 +77,6 @@ class MedrxivClusteringP2P(AbsTaskClustering): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 375000}, + n_samples={"test": 37500}, avg_character_length={"test": 1981.2}, ) diff --git a/mteb/tasks/Clustering/eng/MedrxivClusteringS2S.py b/mteb/tasks/Clustering/eng/MedrxivClusteringS2S.py index 9ca7be8031..a29a0c0201 100644 --- a/mteb/tasks/Clustering/eng/MedrxivClusteringS2S.py +++ b/mteb/tasks/Clustering/eng/MedrxivClusteringS2S.py @@ -1,5 +1,9 @@ from __future__ import annotations +import itertools + +from datasets import Dataset, DatasetDict + from mteb.abstasks.AbsTaskClustering import AbsTaskClustering from mteb.abstasks.AbsTaskClusteringFast import ( AbsTaskClusteringFast, @@ -15,7 +19,7 @@ class MedrxivClusteringS2SFast(AbsTaskClusteringFast): reference="https://api.medrxiv.org/", dataset={ "path": "mteb/medrxiv-clustering-s2s", - "revision": "ec20c81676a749c0f06fb4a9397fc7e168521458", + "revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", }, type="Clustering", category="s2s", @@ -32,20 +36,20 @@ class MedrxivClusteringS2SFast(AbsTaskClusteringFast): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 2048}, + n_samples={"test": 1500}, avg_character_length={"test": 114.9}, ) def dataset_transform(self): + ds = dict() for split in self.metadata.eval_splits: + labels = list(itertools.chain.from_iterable(self.dataset[split]["labels"])) + sentences = list( + itertools.chain.from_iterable(self.dataset[split]["sentences"]) + ) check_label_distribution(self.dataset[split]) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - label="labels", - n_samples=2048, - ) + ds[split] = Dataset.from_dict({"labels": labels, "sentences": sentences}) + 
self.dataset = DatasetDict(ds) class MedrxivClusteringS2S(AbsTaskClustering): @@ -73,6 +77,6 @@ class MedrxivClusteringS2S(AbsTaskClustering): dialect=[], text_creation="created", bibtex_citation="", - n_samples={"test": 375000}, + n_samples={"test": 37500}, avg_character_length={"test": 114.7}, ) diff --git a/mteb/tasks/Clustering/eng/RedditClustering.py b/mteb/tasks/Clustering/eng/RedditClustering.py index a0804c3637..39071f9607 100644 --- a/mteb/tasks/Clustering/eng/RedditClustering.py +++ b/mteb/tasks/Clustering/eng/RedditClustering.py @@ -14,7 +14,7 @@ class RedditFastClusteringS2S(AbsTaskClusteringFast): metadata = TaskMetadata( - name="RedditClusteringS2S.v2", + name="RedditClustering.v2", description="Clustering of titles from 199 subreddits. Clustering of 25 sets, each with 10-50 classes, and each class with 100 - 1000 sentences.", reference="https://arxiv.org/abs/2104.07081", dataset={ @@ -48,7 +48,7 @@ class RedditFastClusteringS2S(AbsTaskClusteringFast): archivePrefix = {arXiv}, eprint = {2104.07081} }""", - n_samples={"test": 16000}, + n_samples={"test": 32768}, avg_character_length={"test": 64.7}, ) @@ -67,12 +67,13 @@ def dataset_transform(self): self.seed, self.metadata.eval_splits, label="labels", - n_samples=16000, + n_samples=32768, ) + self.max_fraction_of_documents_to_embed = None class RedditClustering(AbsTaskClustering): - superseeded_by = "RedditClusteringS2S.v2" + superseeded_by = "RedditClustering.v2" metadata = TaskMetadata( name="RedditClustering", description="Clustering of titles from 199 subreddits. 
Clustering of 25 sets, each with 10-50 classes, and each class with 100 - 1000 sentences.", diff --git a/mteb/tasks/Clustering/eng/RedditClusteringP2P.py b/mteb/tasks/Clustering/eng/RedditClusteringP2P.py index 015f5bb41f..6d6f290c35 100644 --- a/mteb/tasks/Clustering/eng/RedditClusteringP2P.py +++ b/mteb/tasks/Clustering/eng/RedditClusteringP2P.py @@ -91,7 +91,7 @@ class RedditFastClusteringP2P(AbsTaskClusteringFast): archivePrefix = {arXiv}, eprint = {2104.07081} }""", - n_samples={"test": 16000}, + n_samples={"test": 18375}, avg_character_length={"test": 727.7}, ) @@ -116,10 +116,3 @@ def dataset_transform(self): ds[split] = Dataset.from_dict({"labels": labels, "sentences": sentences}) self.dataset = DatasetDict(ds) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - label="labels", - n_samples=16000, - ) diff --git a/mteb/tasks/Clustering/eng/StackExchangeClustering.py b/mteb/tasks/Clustering/eng/StackExchangeClustering.py index f8804845a3..8c33ec868a 100644 --- a/mteb/tasks/Clustering/eng/StackExchangeClustering.py +++ b/mteb/tasks/Clustering/eng/StackExchangeClustering.py @@ -48,7 +48,7 @@ class StackExchangeClusteringFast(AbsTaskClusteringFast): archivePrefix = {arXiv}, eprint = {2104.07081} }""", - n_samples={"test": 16000}, + n_samples={"test": 32768}, avg_character_length={"test": 57.0}, ) @@ -69,8 +69,9 @@ def dataset_transform(self): self.seed, self.metadata.eval_splits, label="labels", - n_samples=16000, + n_samples=32768, ) + self.max_fraction_of_documents_to_embed = None class StackExchangeClustering(AbsTaskClustering): diff --git a/mteb/tasks/Clustering/eng/StackExchangeClusteringP2P.py b/mteb/tasks/Clustering/eng/StackExchangeClusteringP2P.py index 09af30d457..66f5969161 100644 --- a/mteb/tasks/Clustering/eng/StackExchangeClusteringP2P.py +++ b/mteb/tasks/Clustering/eng/StackExchangeClusteringP2P.py @@ -50,7 +50,7 @@ class StackExchangeClusteringP2PFast(AbsTaskClusteringFast): archivePrefix = 
{arXiv}, eprint = {2104.07081} }""", - n_samples={"test": 16000}, + n_samples={"test": 2996}, avg_character_length={"test": 1090.7}, ) @@ -75,13 +75,6 @@ def dataset_transform(self): ds[split] = Dataset.from_dict({"labels": labels, "sentences": sentences}) self.dataset = DatasetDict(ds) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - self.metadata.eval_splits, - label="labels", - n_samples=16000, - ) class StackExchangeClusteringP2P(AbsTaskClustering): diff --git a/mteb/tasks/Clustering/eng/TwentyNewsgroupsClustering.py b/mteb/tasks/Clustering/eng/TwentyNewsgroupsClustering.py index ff73ec5f17..92f59edbce 100644 --- a/mteb/tasks/Clustering/eng/TwentyNewsgroupsClustering.py +++ b/mteb/tasks/Clustering/eng/TwentyNewsgroupsClustering.py @@ -92,7 +92,7 @@ class TwentyNewsgroupsClusteringFast(AbsTaskClusteringFast): author = {Ken Lang}, } """, - n_samples={"test": 2048}, + n_samples={"test": 2381}, avg_character_length={"test": 32.0}, ) @@ -108,9 +108,3 @@ def dataset_transform(self): ds[split] = Dataset.from_dict({"labels": labels, "sentences": sentences}) self.dataset = DatasetDict(ds) - self.dataset = self.stratified_subsampling( - self.dataset, - self.seed, - label="labels", - n_samples=2048, - ) diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..3aa8a59726 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 777.1277756690979, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.39440333414370987, + "v_measure": 0.39440333414370987, + "v_measure_std": 
0.008581999510788163, + "v_measures": [ + 0.3917958283104731, + 0.3976716777098096, + 0.40355231070272335, + 0.373137475916239, + 0.39991311271437163, + 0.40390042586044406, + 0.38799405030896195, + 0.3965423039764483, + 0.397645797867978, + 0.3918803580696496 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..6e5d848739 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 24.745657205581665, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.41671936179830205, + "v_measure": 0.41671936179830205, + "v_measure_std": 0.011540793687140519, + "v_measures": { + "Level 0": [ + 0.41790088959899296, + 0.40153754167071154, + 0.3977312594576458, + 0.4216246118032285, + 0.41293231868079167, + 0.41359303690270827, + 0.43278603975913643, + 0.42676055778957683, + 0.4090636253521346, + 0.43326373696809367 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..05afb3768b --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 61.351367235183716, + 
"kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.36618045119714715, + "v_measure": 0.36618045119714715, + "v_measure_std": 0.011531340072622196, + "v_measures": [ + 0.36114969283791015, + 0.36891445460044364, + 0.36163725831243365, + 0.363033909789725, + 0.3545098264916609, + 0.3527991389322706, + 0.37018911813889294, + 0.3860029985726374, + 0.35630299102391627, + 0.38726512327158114 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..347925ff52 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 5.298211336135864, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.39655966923632036, + "v_measure": 0.39655966923632036, + "v_measure_std": 0.010653039465331793, + "v_measures": { + "Level 0": [ + 0.39036249423358543, + 0.40097419897175324, + 0.412597544439385, + 0.39358730050837715, + 0.37151648289028316, + 0.40719654426126234, + 0.3917090958209424, + 0.3963214849729259, + 0.3980849045241106, + 0.40324664174057767 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..0d9776da4c --- /dev/null +++ 
b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 436.13413286209106, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3320930386787777, + "v_measure": 0.3320930386787777, + "v_measure_std": 0.01432017103509547, + "v_measures": [ + 0.3159311682742844, + 0.3226157572017578, + 0.32497912487263847, + 0.31978698562021995, + 0.31380447038572096, + 0.3525481662301037, + 0.3507450230893816, + 0.3515898507679645, + 0.33611469788018095, + 0.3328151424655248 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..1bf1216657 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 20.242704391479492, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3647703373858422, + "v_measure": 0.3647703373858422, + "v_measure_std": 0.008927999427499306, + "v_measures": { + "Level 0": [ + 0.36250409683049, + 0.3476670023873491, + 0.3620178030033809, + 0.37087005586496347, + 0.35910863381899083, + 0.36272170419591354, + 0.36745110270788583, + 0.3831164463636247, + 0.37208019254178504, + 0.3601663361440384 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git 
a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..147098a316 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 34.84062385559082, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31678936233423916, + "v_measure": 0.31678936233423916, + "v_measure_std": 0.015660625748838235, + "v_measures": [ + 0.2970687818009131, + 0.30652438424086176, + 0.2961629560347047, + 0.3033435105609232, + 0.30759600672709003, + 0.33162966661301724, + 0.328487735200982, + 0.3397078621754543, + 0.3358313674164977, + 0.32154135257194727 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..65ebc3dce1 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 5.479676246643066, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35024221152776636, + "v_measure": 0.35024221152776636, + "v_measure_std": 0.005159654800337718, + "v_measures": { + "Level 0": [ + 0.3523041402550056, + 0.3486858109284018, + 0.34693317675261465, + 0.34881135875254043, + 
0.34445029245650943, + 0.344829342458049, + 0.34792310643129176, + 0.35146553178893725, + 0.3540304389995867, + 0.36298891645472675 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.json new file mode 100644 index 0000000000..92bd70e833 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 375.62032413482666, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5660711132724433, + "v_measure": 0.5660711132724433, + "v_measure_std": 0.05154777346896376, + "v_measures": [ + 0.5826683596168553, + 0.6374354987310801, + 0.5006399487828275, + 0.5599555833529665, + 0.553370946454432, + 0.5385836878331731, + 0.5825386762613354, + 0.49964374262064243, + 0.5385965320402677, + 0.5238565054761791, + 0.5176587505639665, + 0.6008395139626939, + 0.5577297831043375, + 0.5716407618618421, + 0.6821623628927163, + 0.5182078636562623, + 0.5991687248615399, + 0.6756288410915288, + 0.5427660444209756, + 0.5327263322917711, + 0.5264571812647164, + 0.5459946027383078, + 0.6619165511407671, + 0.58824420320592, + 0.5133468335839784 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.v2.json new file mode 100644 index 0000000000..832f853b52 --- /dev/null +++ 
b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 32.571887254714966, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5267361142027605, + "v_measure": 0.5267361142027605, + "v_measure_std": 0.012213586741865694, + "v_measures": { + "Level 0": [ + 0.5366100999408451, + 0.5332629163529715, + 0.5338961457611263, + 0.5439400048183071, + 0.5141842906432071, + 0.5368107173281771, + 0.520076037439041, + 0.500606504773758, + 0.5252342952000336, + 0.5227401297701363 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.json new file mode 100644 index 0000000000..2afbc02f90 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 2379.5412561893463, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6265647952538611, + "v_measure": 0.6265647952538611, + "v_measure_std": 0.13756467725269644, + "v_measures": [ + 0.6733551423928007, + 0.6732047583732851, + 0.6781581829063386, + 0.37327823319371817, + 0.7106057103385515, + 0.6317412190022346, + 0.3436554713646762, + 0.7376763710959159, + 0.7082732035253905, + 0.7356996603457007 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git 
a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..5266b900b2 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 105.30910229682922, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.638720606753781, + "v_measure": 0.638720606753781, + "v_measure_std": 0.004432929389151057, + "v_measures": { + "Level 0": [ + 0.6379955218861557, + 0.6454001931478575, + 0.6368926848975903, + 0.6355266342502021, + 0.6437159274793, + 0.6363764453495968, + 0.6302513439856101, + 0.6445164973914553, + 0.6391708811819383, + 0.6373599379681031 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.json new file mode 100644 index 0000000000..b09c9863df --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 292.5053720474243, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6611151950152403, + "v_measure": 0.6611151950152403, + "v_measure_std": 0.055340590036143396, + "v_measures": [ + 0.6851465029606203, + 0.6966861777177117, + 0.5675254556526353, + 0.6659633708232933, + 
0.6707729854998247, + 0.613844702113425, + 0.5999916760385908, + 0.7527217463412903, + 0.6523476826107588, + 0.6697937400249022, + 0.7746840613363474, + 0.7860867259444937, + 0.7560088214143146, + 0.667323114751532, + 0.6100765978477901, + 0.6269766460752062, + 0.6478103344410351, + 0.6283739914292072, + 0.6264280121830134, + 0.6434559345581252, + 0.6545174769498185, + 0.639365433328066, + 0.5800535467509194, + 0.6629325057812006, + 0.6489926328068876 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..e766b152e2 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 32.72022986412048, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5533297004859964, + "v_measure": 0.5533297004859964, + "v_measure_std": 0.009303140286447797, + "v_measures": { + "Level 0": [ + 0.5605729742984057, + 0.5546763255935093, + 0.5469880751844894, + 0.5622625010266126, + 0.533495720395276, + 0.5509607570319965, + 0.5628308046578062, + 0.5462603205412908, + 0.5500401159906116, + 0.5652094101399657 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..4a6623c45a --- /dev/null +++ 
b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 581.4754991531372, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3523859931066552, + "v_measure": 0.3523859931066552, + "v_measure_std": 0.01698049637695688, + "v_measures": [ + 0.340799489633914, + 0.3357140660563895, + 0.33039927742817043, + 0.3319496194605114, + 0.3416884512851855, + 0.37597360575452043, + 0.36821075173919343, + 0.360086282038675, + 0.3706345149538094, + 0.3684038727161832 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..bbc99e358f --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 29.96759581565857, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.40645947103989294, + "v_measure": 0.40645947103989294, + "v_measure_std": 0.008734596237860525, + "v_measures": { + "Level 0": [ + 0.40935492280745184, + 0.3866755730263645, + 0.40293811244377187, + 0.4152943513973367, + 0.40489343673189104, + 0.40731996079925664, + 0.4011122070592509, + 0.4032459985962018, + 0.41946850087560705, + 0.41429164666179735 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git 
a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..5829218bb7 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 27.8270263671875, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5075400848683261, + "v_measure": 0.5075400848683261, + "v_measure_std": 0.011873426720678001, + "v_measures": [ + 0.5165065319441966, + 0.5007593841280532, + 0.5117411948809809, + 0.5325035353499994, + 0.5008187050697264, + 0.5118453843850534, + 0.5050624947508916, + 0.5121236090168767, + 0.4979351917610641, + 0.48610481739642003 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.v2.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..33843c3e72 --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 4.340036630630493, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.501358752662136, + "v_measure": 0.501358752662136, + "v_measure_std": 0.017643729288488494, + "v_measures": { + "Level 0": [ + 0.503371353688989, + 0.5032976135241535, + 0.48013960653119886, + 
0.5483822233004637, + 0.5078017408553777, + 0.4866465039736367, + 0.4943784209763925, + 0.5006592619591322, + 0.4899137091857001, + 0.49899709262631603 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/model_meta.json b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/model_meta.json new file mode 100644 index 0000000000..96828cad2b --- /dev/null +++ b/results/BAAI__bge-base-en-v1.5/a5beb1e3e68b9ab74eb54cfd186867f64f240e1a/model_meta.json @@ -0,0 +1 @@ +{"name": "BAAI/bge-base-en-v1.5", "revision": "a5beb1e3e68b9ab74eb54cfd186867f64f240e1a", "release_date": "2023-09-11", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "BGEWrapper"} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..3d46bd16bd --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 779.6743319034576, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3711689213861582, + "v_measure": 0.3711689213861582, + "v_measure_std": 0.007056474352968967, + "v_measures": [ + 0.3807543996587275, + 0.3633021753815821, + 0.3676882118744135, + 0.3687727562736903, + 0.375941998736464, + 0.38173423104513415, + 0.3703522519565331, + 0.36457423266293576, + 0.3608985639356183, + 0.3776703923364835 + ] + } + ] + }, + "task_name": 
"BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..d594d2fda9 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 24.953575372695923, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3911946928392568, + "v_measure": 0.3911946928392568, + "v_measure_std": 0.006438588643936885, + "v_measures": { + "Level 0": [ + 0.3903491897604992, + 0.3908341638410035, + 0.39889031965332117, + 0.39202127631945194, + 0.3958097667620781, + 0.40243616389475695, + 0.37869224014288366, + 0.3884506021610787, + 0.3895640232569745, + 0.38489918260052025 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..a044683391 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 66.49916672706604, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33408904429780945, + "v_measure": 0.33408904429780945, + "v_measure_std": 0.006736717488046786, + "v_measures": [ + 0.32940515827770667, + 0.33652762829600685, + 
0.3401292196030229, + 0.330407153903208, + 0.3291338220004731, + 0.3303315288264198, + 0.3262780325294901, + 0.3399265501097091, + 0.3297255540293177, + 0.3490257954027401 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..657fa14742 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 5.164421558380127, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.358364074912478, + "v_measure": 0.358364074912478, + "v_measure_std": 0.010099972906064836, + "v_measures": { + "Level 0": [ + 0.37156475831350266, + 0.3457624094562136, + 0.3417047639689733, + 0.36030591631654846, + 0.3486221188266999, + 0.3571954211214105, + 0.3598704822436495, + 0.36527451096664154, + 0.37446291707424023, + 0.3588774508369004 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..9f5ddc9e5a --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 437.5574972629547, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": 
[ + "eng-Latn" + ], + "main_score": 0.31815239658725913, + "v_measure": 0.31815239658725913, + "v_measure_std": 0.01437578434142839, + "v_measures": [ + 0.30075826181301013, + 0.30121026774047355, + 0.3031910785997809, + 0.306078604657783, + 0.31574931057925354, + 0.3407028727667541, + 0.3246748153794257, + 0.3347722094354529, + 0.33463937261725935, + 0.31974717228339783 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..14b4f45147 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 20.39490556716919, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3553594605417122, + "v_measure": 0.3553594605417122, + "v_measure_std": 0.008225346393502699, + "v_measures": { + "Level 0": [ + 0.3523703130111339, + 0.3487654759823081, + 0.36460719575675593, + 0.3566131522698559, + 0.3420302833471538, + 0.3479292597917499, + 0.36338298384005957, + 0.3483149570890772, + 0.3672693760083565, + 0.362311608320671 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..cc01b35a18 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": 
"35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 36.63607144355774, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2967975888813038, + "v_measure": 0.2967975888813038, + "v_measure_std": 0.014401899859793517, + "v_measures": [ + 0.2848416757045636, + 0.2959044184688961, + 0.2795960368451605, + 0.2825894441270454, + 0.28904155767005074, + 0.3234195765125117, + 0.2972550618349341, + 0.32125338544635806, + 0.3027533224381085, + 0.2913214097654094 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..324c9cd341 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 5.435777425765991, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33347301106853483, + "v_measure": 0.33347301106853483, + "v_measure_std": 0.006896358853349648, + "v_measures": { + "Level 0": [ + 0.3278545833285326, + 0.33320774197210096, + 0.33737074625953306, + 0.32647211021659667, + 0.33504446834899854, + 0.3300092452571598, + 0.3231564498158958, + 0.34763371032037127, + 0.3410884397465966, + 0.33289261541956355 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.json new file 
mode 100644 index 0000000000..35a633ae49 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 413.73885917663574, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5653713988148936, + "v_measure": 0.5653713988148936, + "v_measure_std": 0.05599793134105555, + "v_measures": [ + 0.6083594592896844, + 0.6282966499991045, + 0.5069191842852458, + 0.5541494992233397, + 0.554216867201631, + 0.5519659489270933, + 0.613269559447958, + 0.5010446934880212, + 0.5335099650892506, + 0.5385152193073659, + 0.5047798115126595, + 0.5622127481749373, + 0.5601568063685916, + 0.5794133559136945, + 0.6527737683113702, + 0.5012428987092308, + 0.5737719840953437, + 0.6881984422096482, + 0.5464204067219086, + 0.5473901412560249, + 0.5290306067708539, + 0.5153708161502937, + 0.7086825902607814, + 0.5769158347113487, + 0.49767771294695734 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.v2.json new file mode 100644 index 0000000000..8efa027aa8 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 33.857632875442505, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5122635899930399, + "v_measure": 0.5122635899930399, + "v_measure_std": 0.02040001824946415, + "v_measures": { + "Level 0": [ + 0.5339792785498363, + 
0.5127657842566198, + 0.5425730987976187, + 0.5374254815733197, + 0.4878512092710704, + 0.498007470033854, + 0.48200396552798214, + 0.5244004121805728, + 0.49645336858571726, + 0.5071758311538069 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.json new file mode 100644 index 0000000000..d26e59d5f0 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 2393.2942266464233, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6323486223988497, + "v_measure": 0.6323486223988497, + "v_measure_std": 0.12239058534551613, + "v_measures": [ + 0.6617301587670905, + 0.6647586424160368, + 0.6937195710639809, + 0.3882219872107206, + 0.7169945216259029, + 0.633268724904716, + 0.4016452638206048, + 0.7358239556494944, + 0.7037604278085643, + 0.7235629707213856 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..21d052c8f1 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 106.2341423034668, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + 
"eng-Latn" + ], + "main_score": 0.6161027087340416, + "v_measure": 0.6161027087340416, + "v_measure_std": 0.0050706645527014895, + "v_measures": { + "Level 0": [ + 0.6203736563174647, + 0.6211594750325465, + 0.6126321005659731, + 0.6081239364199233, + 0.6171120305430524, + 0.621921317644637, + 0.6164605171265777, + 0.6148088508778567, + 0.6210664804481952, + 0.607368722364189 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.json new file mode 100644 index 0000000000..34657189cb --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 309.14301013946533, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.64604146543404, + "v_measure": 0.64604146543404, + "v_measure_std": 0.04524872793939309, + "v_measures": [ + 0.7199319736136006, + 0.6738492751686043, + 0.5645298080558337, + 0.652348672187612, + 0.5859380763649736, + 0.6101403186177303, + 0.6074961120410487, + 0.7303805227864945, + 0.6652104209881352, + 0.6594132878826369, + 0.6930843380450249, + 0.7161687415455774, + 0.7112542082865904, + 0.7025274027928885, + 0.5956188460539461, + 0.6459354776132272, + 0.6323364033179264, + 0.6361180546531052, + 0.616031924671681, + 0.605783904230308, + 0.6603007926610304, + 0.6306082725789917, + 0.6188153358951854, + 0.6211200514965063, + 0.5960944143023409 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git 
a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..111922a91a --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 33.7830171585083, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5311466874767545, + "v_measure": 0.5311466874767545, + "v_measure_std": 0.008211755898140294, + "v_measures": { + "Level 0": [ + 0.5289893304073823, + 0.5443716465979148, + 0.5231414440953195, + 0.5327878212351028, + 0.5460852176108789, + 0.5246539880904284, + 0.5234606889818078, + 0.5372249472922062, + 0.5255485870461373, + 0.5252032034103663 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..2c3ff6cfb1 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 584.0322182178497, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3301535658734802, + "v_measure": 0.3301535658734802, + "v_measure_std": 0.015493704484823902, + "v_measures": [ + 0.31890706223692195, + 0.32044307701661306, + 0.31005803229984974, + 0.3177012680888083, 
+ 0.3153628166396013, + 0.36204998911637076, + 0.33304458124594366, + 0.3422431685262168, + 0.3415108540172161, + 0.3402148095472609 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..b9e6c33b5f --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 30.189608812332153, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3953167019072793, + "v_measure": 0.3953167019072793, + "v_measure_std": 0.005778919889196468, + "v_measures": { + "Level 0": [ + 0.39787020578132626, + 0.39491801976144836, + 0.4058638142169556, + 0.3894241112972474, + 0.3877900158114598, + 0.3928936310738038, + 0.38906041782167755, + 0.3935872538351701, + 0.40359691510328377, + 0.3981626343704206 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..befeb8cfa0 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 30.525418996810913, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + 
"languages": [ + "eng-Latn" + ], + "main_score": 0.49856012975943853, + "v_measure": 0.49856012975943853, + "v_measure_std": 0.016648564614337825, + "v_measures": [ + 0.47666313994083465, + 0.48436026136313826, + 0.4918727075900399, + 0.48898462890706085, + 0.5069067113181409, + 0.522951355031455, + 0.47929236549196796, + 0.528112227092821, + 0.5023761561426264, + 0.5040817447163003 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.v2.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..c59f41cd86 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 4.5293262004852295, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4836694939036682, + "v_measure": 0.4836694939036682, + "v_measure_std": 0.015249602266826543, + "v_measures": { + "Level 0": [ + 0.5074530142289061, + 0.4722047471870994, + 0.4728945702372941, + 0.49464312421119094, + 0.5039767075071102, + 0.4561770131210821, + 0.47342287673769895, + 0.48489827075585384, + 0.4780835293422749, + 0.49294108570817147 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/model_meta.json b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/model_meta.json new file mode 100644 index 0000000000..abb1f3d422 --- /dev/null +++ b/results/intfloat__e5-base-v2/1c644c92ad3ba1efdad3f1451a637716616a20e8/model_meta.json @@ -0,0 +1 @@ +{"name": 
"intfloat/e5-base-v2", "revision": "1c644c92ad3ba1efdad3f1451a637716616a20e8", "release_date": "2024-02-08", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..9ff4907309 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 2467.8042948246, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3672394652554166, + "v_measure": 0.3672394652554166, + "v_measure_std": 0.007397613976716682, + "v_measures": [ + 0.3738774449790624, + 0.38023354785161845, + 0.3617589533405553, + 0.362939779299527, + 0.35775836721065946, + 0.3721461323990733, + 0.36600568601234873, + 0.37632836661667146, + 0.3615350769331085, + 0.35981129791154154 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..94ba8dd7bd --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 73.5835657119751, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + 
"test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.397176428189129, + "v_measure": 0.397176428189129, + "v_measure_std": 0.009320379048162644, + "v_measures": { + "Level 0": [ + 0.39161074947551, + 0.3972276394302246, + 0.4179950542344692, + 0.40249476421417146, + 0.3874902825510115, + 0.3860104327047624, + 0.40421432912190564, + 0.3971016346714517, + 0.3872787291511981, + 0.40034066633658594 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..e63032eb54 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 200.92669582366943, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3546663339916155, + "v_measure": 0.3546663339916155, + "v_measure_std": 0.009365874706302691, + "v_measures": [ + 0.3560305584962096, + 0.34538118351907743, + 0.348432991557803, + 0.3567165998335342, + 0.34331774248519087, + 0.36191828186573033, + 0.343896060818805, + 0.3686708544572132, + 0.35197096031199776, + 0.3703281065705938 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..dac5af6a4d --- /dev/null +++ 
b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 9.408823728561401, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3717788962965562, + "v_measure": 0.3717788962965562, + "v_measure_std": 0.013360590478514298, + "v_measures": { + "Level 0": [ + 0.3802204868404927, + 0.3525640753790324, + 0.3697642555521002, + 0.38633978625576226, + 0.38364066622781673, + 0.3796080174204095, + 0.36437420078961175, + 0.363157764039173, + 0.38884076980432514, + 0.3492789406568385 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..dc9f634311 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 1352.6134810447693, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31450740853371567, + "v_measure": 0.31450740853371567, + "v_measure_std": 0.01242717025119835, + "v_measures": [ + 0.29917806727822893, + 0.31487496231534806, + 0.3094679573601618, + 0.29875952996609906, + 0.2986687882119296, + 0.3335938151175009, + 0.3283226447833997, + 0.32761808153145233, + 0.31269163781074216, + 0.321898600962294 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git 
a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..eed42f339c --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 57.98740196228027, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35215934606100385, + "v_measure": 0.35215934606100385, + "v_measure_std": 0.004311967458706847, + "v_measures": { + "Level 0": [ + 0.3544899440850619, + 0.3419729312373265, + 0.353272462768754, + 0.3594824167955063, + 0.3509152255702455, + 0.35401734544210295, + 0.3523227914155818, + 0.3516655946177408, + 0.35457569000318484, + 0.34887905867453434 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..1319bb5b69 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 110.54792213439941, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.29909963825947133, + "v_measure": 0.29909963825947133, + "v_measure_std": 0.011115579159618558, + "v_measures": [ + 0.29151359135787075, + 0.28898535949146714, + 0.28814314211087916, + 0.29263093585765737, + 
0.28687146831792315, + 0.31876055334489795, + 0.3014252885026561, + 0.3061058538401158, + 0.3170746484180315, + 0.29948554135321426 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..ed51bab96b --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 8.588359355926514, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3385838541505167, + "v_measure": 0.3385838541505167, + "v_measure_std": 0.00936960395657303, + "v_measures": { + "Level 0": [ + 0.33661199876853914, + 0.31349215303897215, + 0.3429341742345396, + 0.3408105920842293, + 0.3364352597109661, + 0.3362430639073333, + 0.34502913141453573, + 0.34884370009947063, + 0.33888355112805696, + 0.34655491711852404 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.json new file mode 100644 index 0000000000..d28d1b8516 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 1237.830090045929, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 
0.554997966486664, + "v_measure": 0.554997966486664, + "v_measure_std": 0.06369363090002754, + "v_measures": [ + 0.5992801709344349, + 0.6346041727077204, + 0.4940350439676296, + 0.5668407780314241, + 0.5584566901267188, + 0.5594253951502438, + 0.5894774957036318, + 0.5038470727199881, + 0.49696784371621583, + 0.5013216829506099, + 0.522976497516942, + 0.6006487364957644, + 0.5262955817946007, + 0.5425059123444281, + 0.7147404831193653, + 0.4942805331982798, + 0.5831717341954291, + 0.6795317312714327, + 0.510218244454103, + 0.4567106294365542, + 0.48164778527405044, + 0.5209184857098321, + 0.653887650922213, + 0.5664712226356713, + 0.5166875877893174 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.v2.json new file mode 100644 index 0000000000..3729be8a13 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 102.21613621711731, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4858953604929018, + "v_measure": 0.4858953604929018, + "v_measure_std": 0.011996961508966422, + "v_measures": { + "Level 0": [ + 0.48421827017108426, + 0.4992476654054556, + 0.47291630505884624, + 0.4756930942527921, + 0.48702009269702035, + 0.4960352419102772, + 0.49328767963362663, + 0.4655815563905837, + 0.5052756938339665, + 0.4796780055753648 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.json 
b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.json new file mode 100644 index 0000000000..f313558e0d --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 7636.0380737781525, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6370633126955434, + "v_measure": 0.6370633126955434, + "v_measure_std": 0.11559459183230124, + "v_measures": [ + 0.6844742821956354, + 0.6911678272452055, + 0.6519381485995118, + 0.37717619714345724, + 0.7262729519420306, + 0.6357815536341453, + 0.4549113574972448, + 0.7287831567661298, + 0.6946786477605348, + 0.7254490041715388 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..265fc9d9f0 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 325.6005687713623, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6172405658925249, + "v_measure": 0.6172405658925249, + "v_measure_std": 0.008332188813774377, + "v_measures": { + "Level 0": [ + 0.6232076006561355, + 0.6283435376933579, + 0.6065177173941129, + 0.6093826781902506, + 0.6244506284613052, + 0.6230695109749914, + 0.606198207240463, + 0.6268029268779168, + 0.610115433770851, + 0.6143174176658642 + ] + } 
+ } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.json new file mode 100644 index 0000000000..35ef8f37ea --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 963.4406597614288, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.652310289571111, + "v_measure": 0.652310289571111, + "v_measure_std": 0.04378853470993744, + "v_measures": [ + 0.6779129712294665, + 0.7163425038003004, + 0.5760699141523622, + 0.701721612043686, + 0.6393636658490027, + 0.6042464498801883, + 0.6171412368704584, + 0.7213847302795137, + 0.6306224520444482, + 0.6699946627482336, + 0.7256874222517498, + 0.6950492566187088, + 0.7236445250789381, + 0.695536814063526, + 0.6142119226815635, + 0.6341882780280998, + 0.6248762004047377, + 0.6381287789536728, + 0.6182113655473385, + 0.6285392588222483, + 0.6489273760171093, + 0.6303974325712444, + 0.5736349293586929, + 0.6640533390692047, + 0.6378701409132815 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..779fd6bbec --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + 
"evaluation_time": 97.58061671257019, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5207408773855098, + "v_measure": 0.5207408773855098, + "v_measure_std": 0.010143577781006576, + "v_measures": { + "Level 0": [ + 0.5108265916668678, + 0.512178654787436, + 0.5413250815466998, + 0.5230029267733962, + 0.5139904010592331, + 0.5196193297917938, + 0.5137295721001438, + 0.5114246141739172, + 0.5257009409833286, + 0.5356106609722808 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..bd8841d915 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 1830.958482503891, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3361698865959878, + "v_measure": 0.3361698865959878, + "v_measure_std": 0.0160653600393997, + "v_measures": [ + 0.32674509318570594, + 0.3245264625205659, + 0.3165526722611096, + 0.3158324930638145, + 0.321942762019177, + 0.35839859569395577, + 0.34177840057221426, + 0.34927758807037795, + 0.34741029429157866, + 0.3592345042813784 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.v2.json new file mode 
100644 index 0000000000..e8df6c05e3 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 81.74703669548035, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3984375347506265, + "v_measure": 0.3984375347506265, + "v_measure_std": 0.00490496800679445, + "v_measures": { + "Level 0": [ + 0.3946260828697897, + 0.40278628960607493, + 0.40375931702041, + 0.4038177572367214, + 0.39684079229197977, + 0.40366300871003813, + 0.3915464952376379, + 0.39817893493635764, + 0.3899585510285294, + 0.39919811856872595 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..80d16bf3e5 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 87.74184966087341, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.48733975350340736, + "v_measure": 0.48733975350340736, + "v_measure_std": 0.016558537023323175, + "v_measures": [ + 0.45809310702668987, + 0.47081310579946184, + 0.4920652363604418, + 0.47435619423254144, + 0.48705065217212423, + 0.5201409766208283, + 0.4851093687616796, + 0.4855015877175132, + 0.5024495811636626, + 0.4978177251791305 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No 
newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.v2.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..c0ac9eca6a --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 6.978201627731323, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4824365573569779, + "v_measure": 0.4824365573569779, + "v_measure_std": 0.020950361189034757, + "v_measures": { + "Level 0": [ + 0.4857556747044126, + 0.4719530641149698, + 0.4653839257061806, + 0.5243814740624608, + 0.5049709160823869, + 0.4852236142989205, + 0.48340694656560235, + 0.44136812909962864, + 0.47865761496917214, + 0.4832642139660443 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/model_meta.json b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/model_meta.json new file mode 100644 index 0000000000..247d92c403 --- /dev/null +++ b/results/intfloat__e5-large-v2/b322e09026e4ea05f42beadf4d661fb4e101d311/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/e5-large-v2", "revision": "b322e09026e4ea05f42beadf4d661fb4e101d311", "release_date": "2024-02-08", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.json 
b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..647c163539 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 351.17173528671265, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3613581658569338, + "v_measure": 0.3613581658569338, + "v_measure_std": 0.007103622519613694, + "v_measures": [ + 0.3632798914619017, + 0.36736526200015673, + 0.3649324194559493, + 0.34490547883370787, + 0.35713305418417995, + 0.3534995332781896, + 0.3662681229099763, + 0.36107457716061553, + 0.36701136390122385, + 0.36811195538343716 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..a9d4e9c597 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 12.726956367492676, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.37464846514243255, + "v_measure": 0.37464846514243255, + "v_measure_std": 0.005878075676975097, + "v_measures": { + "Level 0": [ + 0.38100376427082094, + 0.37136883775106455, + 0.37281613715029044, + 0.36822879692443194, + 0.38218329561009223, + 0.3715128197027489, + 0.36316694507910713, + 0.3782691609666132, + 0.3782766156434255, + 
0.37965827832573007 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..92d6c3255e --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 27.937171936035156, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2968042178414473, + "v_measure": 0.2968042178414473, + "v_measure_std": 0.006755310407544819, + "v_measures": [ + 0.29864690177900116, + 0.2869036369606473, + 0.301652556309486, + 0.28778555329970007, + 0.3017969570029975, + 0.30286554189606213, + 0.29057567698252407, + 0.29150143927008515, + 0.29864106172908783, + 0.3076728531848818 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..c87e3fdad6 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 3.730611801147461, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31224001745374086, + "v_measure": 0.31224001745374086, + "v_measure_std": 0.007229725144242237, + "v_measures": { + 
"Level 0": [ + 0.3104229360305897, + 0.3092877823606324, + 0.30859388253944486, + 0.30286194564424546, + 0.3136614969200592, + 0.3075918676155071, + 0.30473903556306, + 0.32552238517362064, + 0.3155578695722236, + 0.3241609731180262 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..848d693383 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 201.23111581802368, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31666475705282715, + "v_measure": 0.31666475705282715, + "v_measure_std": 0.012662547551139122, + "v_measures": [ + 0.30726419206992095, + 0.30265318585747536, + 0.30118166808595215, + 0.3030875620589692, + 0.31506744075108095, + 0.3284005700423578, + 0.31391081283140737, + 0.33540511031935255, + 0.3347618543172162, + 0.32491517419453897 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..794cc49fe0 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 11.121971845626831, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + 
"scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3480660307591203, + "v_measure": 0.3480660307591203, + "v_measure_std": 0.008729597263994714, + "v_measures": { + "Level 0": [ + 0.34479481931294786, + 0.3443311076819651, + 0.33400139522070055, + 0.3619609795483745, + 0.35889246612735537, + 0.3390803411402807, + 0.3542365866175847, + 0.3516597512757167, + 0.35247603662170357, + 0.339226824044574 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..8e3b2cc238 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 16.17210030555725, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.283164564799259, + "v_measure": 0.283164564799259, + "v_measure_std": 0.015155702084198797, + "v_measures": [ + 0.26827473117648465, + 0.272649119074579, + 0.26797620924173277, + 0.26129982787466344, + 0.2745093727132204, + 0.30664359717753803, + 0.29038842959592087, + 0.29385761536407184, + 0.30131329896441195, + 0.29473344680996727 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..d36edccc80 --- /dev/null +++ 
b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 4.060302734375, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3150336772588932, + "v_measure": 0.3150336772588932, + "v_measure_std": 0.0069662906315432465, + "v_measures": { + "Level 0": [ + 0.3026320231982677, + 0.31257949644757316, + 0.32154867768683876, + 0.31214222110555023, + 0.32372817905467643, + 0.31094620190979755, + 0.31244238731460605, + 0.3267404449171592, + 0.31800144864379115, + 0.3095756923106721 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.json new file mode 100644 index 0000000000..40a5e19516 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 164.52006793022156, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.457443544893067, + "v_measure": 0.457443544893067, + "v_measure_std": 0.05725099955893965, + "v_measures": [ + 0.5020898340618893, + 0.5025360281153423, + 0.4074998965709022, + 0.4208437545110391, + 0.47711856986814094, + 0.392457719643408, + 0.5130653184623098, + 0.41488879717365684, + 0.42459696145140385, + 0.4447769018209246, + 0.43037567287198036, + 0.5239454296989859, + 0.4551588550276138, + 0.4746363987914386, + 0.5702795228807702, + 0.4110121021325805, + 0.4889453515367223, + 
0.5765031995202085, + 0.37993054866503406, + 0.39712457872001355, + 0.3883712475518408, + 0.41953751687968927, + 0.5577055079978556, + 0.4148152453544856, + 0.44787366301843895 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.v2.json new file mode 100644 index 0000000000..32abe5f111 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 15.87044906616211, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4084442247357899, + "v_measure": 0.4084442247357899, + "v_measure_std": 0.010422431431367691, + "v_measures": { + "Level 0": [ + 0.4030354493809208, + 0.3966717183428491, + 0.400619855607914, + 0.4059486262598946, + 0.4329547895901431, + 0.42114994944404477, + 0.4114536239906265, + 0.40006813187778506, + 0.40649648399225013, + 0.4060436188714708 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.json new file mode 100644 index 0000000000..bc888ec185 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 1031.6095232963562, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + 
"eng-Latn" + ], + "main_score": 0.5986311932913578, + "v_measure": 0.5986311932913578, + "v_measure_std": 0.1158972234978085, + "v_measures": [ + 0.6440791091200495, + 0.6355074016869999, + 0.6469322086040408, + 0.3727114507395317, + 0.6824245256136253, + 0.6013995697480568, + 0.37103504044945124, + 0.6753473170755456, + 0.6724762514398748, + 0.6843990584364021 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..975b0c9a8d --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 48.343266248703, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.580522381202967, + "v_measure": 0.580522381202967, + "v_measure_std": 0.006543093058959593, + "v_measures": { + "Level 0": [ + 0.5884102293940566, + 0.5841124632359008, + 0.5828424789661785, + 0.5865598894284151, + 0.5796485745957438, + 0.5855589754165801, + 0.5717069618938344, + 0.5798793796284331, + 0.5661383874973958, + 0.5803664719731312 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.json new file mode 100644 index 0000000000..1efc9962d9 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": 
"6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 131.6534924507141, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5786749693067104, + "v_measure": 0.5786749693067104, + "v_measure_std": 0.04851157828913518, + "v_measures": [ + 0.6038475427609066, + 0.6423442010651822, + 0.5132274943643667, + 0.5886488130104082, + 0.5816516197141172, + 0.5119608192960428, + 0.5080101638361733, + 0.6494452535856595, + 0.5801403211427602, + 0.571147628691392, + 0.631567504473316, + 0.6719649455303834, + 0.6610790923004143, + 0.6407971890406244, + 0.543821985577552, + 0.548387072347732, + 0.5349593640241069, + 0.5925768419501714, + 0.5256054401477923, + 0.5306452180764517, + 0.5788999152819156, + 0.5183925097034577, + 0.5867034015501511, + 0.5727459243257725, + 0.5783039708709098 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..e0f8df7ada --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 15.56183409690857, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4655300833419639, + "v_measure": 0.4655300833419639, + "v_measure_std": 0.007533566875829111, + "v_measures": { + "Level 0": [ + 0.4567026624166713, + 0.4781530750358173, + 0.45802449001206036, + 0.47583158996519453, + 0.464874716114081, + 0.4602806833377055, + 0.4670358964694553, + 0.47421608044147556, + 
0.46130678618446114, + 0.45887485344271617 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..58d19c9921 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 259.68598222732544, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31907396015131756, + "v_measure": 0.31907396015131756, + "v_measure_std": 0.01280924297336394, + "v_measures": [ + 0.3072356748716255, + 0.30685103271511366, + 0.3090189295524522, + 0.3052029127805473, + 0.3041958697891806, + 0.3302115997718814, + 0.3271299055432762, + 0.33403862603160295, + 0.33103809271724166, + 0.3358169577402535 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..d52bc65d0d --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 15.348011255264282, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.381701495052936, + "v_measure": 0.381701495052936, 
+ "v_measure_std": 0.0059882715623274865, + "v_measures": { + "Level 0": [ + 0.3828059826956902, + 0.3826335078803138, + 0.37920799891506035, + 0.382694062261965, + 0.38087575963799014, + 0.38819200547844224, + 0.378423781223926, + 0.38845693195117315, + 0.3869441836451505, + 0.3667807368396486 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..86ec0e1fb7 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 16.902500867843628, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.41245523322358457, + "v_measure": 0.41245523322358457, + "v_measure_std": 0.014551197354529017, + "v_measures": [ + 0.4114087609518188, + 0.42974156567488775, + 0.3850868654398094, + 0.42363804535245053, + 0.42380427126965614, + 0.4220912132909387, + 0.4151511048533169, + 0.4110350980377996, + 0.41652038401947455, + 0.38607502334569266 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.v2.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..45d2abeb26 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": 
"6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 3.654139757156372, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.41205223085486686, + "v_measure": 0.41205223085486686, + "v_measure_std": 0.022068568047595234, + "v_measures": { + "Level 0": [ + 0.3737723114652832, + 0.4452800099447602, + 0.37508018434911744, + 0.43125470190709353, + 0.4153807354814707, + 0.4136790271968939, + 0.4313514398540077, + 0.4224675771252919, + 0.4064878659568246, + 0.40576845526792543 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/model_meta.json b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/model_meta.json new file mode 100644 index 0000000000..a998beffb9 --- /dev/null +++ b/results/intfloat__e5-small-v2/dca8b1a9dae0d4575df2bf423a5edb485a431236/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/e5-small-v2", "revision": "dca8b1a9dae0d4575df2bf423a5edb485a431236", "release_date": "2024-02-08", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..738d2fdee2 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 350.7559583187103, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": 
"default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3610012956346088, + "v_measure": 0.3610012956346088, + "v_measure_std": 0.012539680600009864, + "v_measures": [ + 0.37123436347856315, + 0.35270011898473436, + 0.3569474834574744, + 0.3396733815867422, + 0.36577568904797714, + 0.36259449347007916, + 0.34865495930601687, + 0.3815862099295279, + 0.3773999463966529, + 0.35344631068832005 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..c67e74da61 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 12.65479302406311, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3816344531951946, + "v_measure": 0.3816344531951946, + "v_measure_std": 0.009422096670958694, + "v_measures": { + "Level 0": [ + 0.37989432697263664, + 0.3771192225156711, + 0.3930962793156987, + 0.3911370984206704, + 0.36889070843871247, + 0.37000648328064434, + 0.3848614294868738, + 0.38228852036569133, + 0.397124892112692, + 0.3719255710426558 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..11f8e27610 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + 
"dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 28.016948223114014, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3151052799617089, + "v_measure": 0.3151052799617089, + "v_measure_std": 0.011540533484604572, + "v_measures": [ + 0.3245264423314214, + 0.30843737351412065, + 0.3082999230291673, + 0.30619537114113, + 0.30517580020450186, + 0.29670069951031625, + 0.3245525242049214, + 0.33217017457988274, + 0.3139575153551249, + 0.3310369757465025 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..1f7a0d81ee --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 3.8613884449005127, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3334109458672628, + "v_measure": 0.3334109458672628, + "v_measure_std": 0.009675657257872103, + "v_measures": { + "Level 0": [ + 0.3463312289884471, + 0.3292517403513273, + 0.3414093977402835, + 0.3281457186142632, + 0.3334312099843353, + 0.34321946463800473, + 0.3122898970979796, + 0.3412461954364403, + 0.3328748742605356, + 0.3259097315610112 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.json 
b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..2f3a2c80e7 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 200.54774618148804, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3130822858667672, + "v_measure": 0.3130822858667672, + "v_measure_std": 0.015357820967639678, + "v_measures": [ + 0.29906442040389203, + 0.2996753551443111, + 0.29654787580388764, + 0.30188213953676823, + 0.30285112803175973, + 0.3348979883976372, + 0.3312591942638761, + 0.33900951413374075, + 0.31312387687863674, + 0.3125113660731623 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..b49861cc98 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 10.914621114730835, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.34459737263951334, + "v_measure": 0.34459737263951334, + "v_measure_std": 0.006872796436997929, + "v_measures": { + "Level 0": [ + 0.35972242143304006, + 0.3469889064098362, + 0.343231308226251, + 0.3459611860680721, + 0.35071503574497287, + 0.3382199172517198, + 0.34353894740724344, + 0.33329988256001114, + 0.3393830008667627, + 0.34491312042722366 + 
] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..bf59636d26 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 16.029958724975586, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2831937611037462, + "v_measure": 0.2831937611037462, + "v_measure_std": 0.012210763731996581, + "v_measures": [ + 0.2697087478679298, + 0.26673623026266374, + 0.27221249462114955, + 0.26861109913635123, + 0.2902184252048006, + 0.2953367455305727, + 0.290187864103038, + 0.3031806231209158, + 0.29071121955070284, + 0.2850341616393377 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..dd30553f1f --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 3.918783664703369, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3231702728191858, + "v_measure": 0.3231702728191858, + "v_measure_std": 0.006798674817544176, + "v_measures": { + "Level 0": [ + 0.3253833635796724, + 
0.3221212019595597, + 0.30703952062360224, + 0.32218863578668505, + 0.31688874888994273, + 0.32337613471341947, + 0.33156700467830635, + 0.32789118438027476, + 0.33102220094748824, + 0.32422473263290713 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.json new file mode 100644 index 0000000000..35c91718e0 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 164.93480920791626, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4327047084994605, + "v_measure": 0.4327047084994605, + "v_measure_std": 0.05476087692658286, + "v_measures": [ + 0.44088612447430425, + 0.5096513526076663, + 0.3735846603660321, + 0.38624138871154556, + 0.42430514840107847, + 0.3953161927361215, + 0.4715006909314474, + 0.3898450625446227, + 0.37264931018001096, + 0.4027837789377052, + 0.3894256491245102, + 0.47604995209628154, + 0.44933118846897296, + 0.4396330507800492, + 0.5189167344261403, + 0.40503350045267733, + 0.4503236973574068, + 0.5770028620531704, + 0.4476077506495646, + 0.3793491897019061, + 0.3805444680673142, + 0.39477610817071596, + 0.5396674937471533, + 0.40036510824267263, + 0.40282724925744107 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.v2.json new file mode 100644 index 0000000000..d96f592871 --- /dev/null +++ 
b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 15.564559936523438, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.38340024602522027, + "v_measure": 0.38340024602522027, + "v_measure_std": 0.014601857402454751, + "v_measures": { + "Level 0": [ + 0.37362238918735513, + 0.3700908350081886, + 0.3646546552124134, + 0.3964838254593654, + 0.3706587969952726, + 0.41324745623101083, + 0.3911805571943866, + 0.38328004915632385, + 0.3750204402520099, + 0.3957634555558763 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.json new file mode 100644 index 0000000000..423454cc78 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 1032.4352898597717, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5722310334636329, + "v_measure": 0.5722310334636329, + "v_measure_std": 0.11033412595562977, + "v_measures": [ + 0.6040467373335107, + 0.6321062697642864, + 0.6116000438597108, + 0.3451529726225897, + 0.64720311659247, + 0.5620197633876244, + 0.37193064062059156, + 0.6596459110125397, + 0.635663018471953, + 0.652941860971054 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git 
a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..2c84f0d95f --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 48.234893560409546, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5564603367498093, + "v_measure": 0.5564603367498093, + "v_measure_std": 0.004899508854361777, + "v_measures": { + "Level 0": [ + 0.5668694637683581, + 0.5560191376653916, + 0.5557000888844499, + 0.5532307713157685, + 0.5593284300088811, + 0.5559344009767576, + 0.5500987305075771, + 0.5583506180941834, + 0.5600379652923252, + 0.5490337609844006 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.json new file mode 100644 index 0000000000..6e9ffd156a --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 132.01438355445862, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5960135841004834, + "v_measure": 0.5960135841004834, + "v_measure_std": 0.048719951869163454, + "v_measures": [ + 0.5820946350018588, + 0.6387984274019307, + 0.5159054623096903, + 0.6062163818171245, + 0.5919232706866341, + 
0.5247116850669843, + 0.5582223325992901, + 0.6464465473042557, + 0.5894142288152241, + 0.598077978088507, + 0.7419711594107024, + 0.633290833214199, + 0.696695337501811, + 0.6115921034372186, + 0.5416970965450053, + 0.5938298393135336, + 0.586443970047695, + 0.6049720748378516, + 0.5611051670017797, + 0.5484294241207932, + 0.6007509780522686, + 0.5627019704715103, + 0.5695686392407111, + 0.6065474196159544, + 0.5889326406095527 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..a1af972191 --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 15.65767502784729, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4832468137399329, + "v_measure": 0.4832468137399329, + "v_measure_std": 0.010346589738808878, + "v_measures": { + "Level 0": [ + 0.4955314048509599, + 0.4787323683986079, + 0.49171539254483143, + 0.48894789855493825, + 0.47050271721465076, + 0.47940093466933154, + 0.48131799084205873, + 0.473195662159697, + 0.4708921611904218, + 0.5022316069738313 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..73d7cef638 --- /dev/null +++ 
b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 259.8926947116852, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.30815510580894634, + "v_measure": 0.30815510580894634, + "v_measure_std": 0.01859119283034541, + "v_measures": [ + 0.29285637252595914, + 0.2929903765497153, + 0.29552500280858307, + 0.2846094546011709, + 0.28540107511881424, + 0.33211585845476277, + 0.3217244746999102, + 0.3185837829855361, + 0.3246752102094282, + 0.33306945013558337 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..b664185a4c --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 15.19907283782959, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3661429204340775, + "v_measure": 0.3661429204340775, + "v_measure_std": 0.005568642707545272, + "v_measures": { + "Level 0": [ + 0.3680515244788594, + 0.37297979609129345, + 0.3668163585569195, + 0.3612736085262788, + 0.36741278815556927, + 0.3726459359321665, + 0.3572093991320925, + 0.35654337106756995, + 0.368799951478008, + 0.3696964709220172 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git 
a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..4cc634aa8b --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 16.825819730758667, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3765399430736874, + "v_measure": 0.3765399430736874, + "v_measure_std": 0.016090914254943717, + "v_measures": [ + 0.40220811176478893, + 0.40782917397845825, + 0.362391006207059, + 0.379399356613916, + 0.3777669960536164, + 0.3745829005038882, + 0.3659256034200708, + 0.3613630755824965, + 0.35668796418392584, + 0.3772452424286534 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.v2.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..17ba05ad9c --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 3.740474224090576, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3833947263662072, + "v_measure": 0.3833947263662072, + "v_measure_std": 0.017521082305739805, + "v_measures": { + "Level 0": [ + 0.3862972903987586, + 0.3723775785967087, + 0.3981709111245807, + 0.34362468095178866, + 
0.3844685618794919, + 0.393578572467558, + 0.3630475482556308, + 0.39639986489295154, + 0.39438740056952276, + 0.4015948545250801 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/model_meta.json b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/model_meta.json new file mode 100644 index 0000000000..5f6a537aab --- /dev/null +++ b/results/intfloat__e5-small/e272f3049e853b47cb5ca3952268c6662abda68f/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/e5-small", "revision": "e272f3049e853b47cb5ca3952268c6662abda68f", "release_date": "2024-02-08", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringP2P.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringP2P.json new file mode 100644 index 0000000000..df98f091dd --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringP2P.json @@ -0,0 +1,53 @@ +{ + "dataset_revision": "a122ad7f3f0291bf49cc6f4d32aa80929df69d5d", + "evaluation_time": 5956.89071726799, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.43349302457921374, + "v_measure": 0.43349302457921374, + "v_measure_std": 0.1364251955618546, + "v_measures": [ + 0.4375374710331693, + 0.4335833284349304, + 0.4442562202883246, + 0.42886174476641203, + 0.440046121701213, + 0.42365577956034545, + 0.4479905027317126, + 0.4416411502662394, + 0.44979388529802605, + 0.4264278118014404, + 0.49015474228134426, + 0.4965549566321279, + 
0.49913208095301126, + 0.49311519626206174, + 0.5020592583507317, + 0.4961742409523277, + 0.4981036648421845, + 0.5016195447907335, + 0.49085665434830283, + 0.4876233393905936, + 0.48673005513268247, + 0.27635101777404647, + 0.35199688618967534, + 0.39971187959824844, + 0.33500264004632047, + 0.250705054268768, + 0.29851885382362764, + 0.18783946095273527, + 0.26450069861624764, + 1.0, + 0.25773952086804053 + ] + } + ] + }, + "task_name": "ArxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringS2S.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringS2S.json new file mode 100644 index 0000000000..34379a8de5 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/ArxivClusteringS2S.json @@ -0,0 +1,53 @@ +{ + "dataset_revision": "f910caf1a6075f7329cdf8c1a6135696f37dbd53", + "evaluation_time": 642.6562016010284, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3599685331336122, + "v_measure": 0.3599685331336122, + "v_measure_std": 0.14195867445473556, + "v_measures": [ + 0.3426487605848568, + 0.36724242846846333, + 0.3731124032012833, + 0.3763011618674275, + 0.36131760012019704, + 0.3655304153402566, + 0.35266898380937584, + 0.3627276679385288, + 0.369701361173338, + 0.36735078275468586, + 0.4107434429231091, + 0.40636568528715544, + 0.4069515322665795, + 0.41629982571430263, + 0.4133061305493453, + 0.4042995862810529, + 0.4071682767838659, + 0.41016983893517645, + 0.40133492327322157, + 0.406152286710825, + 0.3974544822753718, + 0.21979922296243998, + 0.24967571742716974, + 0.3477254687952808, + 0.26337043134517085, + 0.18409340225001208, + 0.23796358995125597, + 0.13419300996472683, + 0.22323250704891567, + 1.0, + 0.18012360113858691 + ] + } + ] + }, + 
"task_name": "ArxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..e8680ac696 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 820.3113701343536, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.37546545327462166, + "v_measure": 0.37546545327462166, + "v_measure_std": 0.007224219589964202, + "v_measures": [ + 0.3847993083126385, + 0.36012736021567093, + 0.3764092094693905, + 0.37456870676066123, + 0.37447242205156217, + 0.37698920069059166, + 0.3768374024688923, + 0.3771127731522384, + 0.36699903153320285, + 0.3863391180913681 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.v2.json index 52237acd20..a9506b05a1 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringP2P.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", - "evaluation_time": 24.2448787689209, + "evaluation_time": 25.730472087860107, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], 
- "main_score": 0.38075345988938974, - "v_measure": 0.38075345988938974, + "main_score": 0.38867753499529095, + "v_measure": 0.38867753499529095, + "v_measure_std": 0.007195898753384672, "v_measures": { "Level 0": [ - 0.3775795542321043, - 0.37277274434904106, - 0.39419813536344916, - 0.378585437364803, - 0.3823755549760364, - 0.3776130891340631, - 0.379783619915026, - 0.37622214405595134, - 0.3860120835546164, - 0.38239223594880634 + 0.3769547144324447, + 0.38640087665448475, + 0.3903090997170115, + 0.37538733516667133, + 0.3992968670691309, + 0.390101530111181, + 0.39106849981951025, + 0.39368669999574535, + 0.39572142768358787, + 0.3878482993031414 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..b026846e34 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 68.6751868724823, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3033472429952135, + "v_measure": 0.3033472429952135, + "v_measure_std": 0.00927590986782203, + "v_measures": [ + 0.29574428391631413, + 0.30084877704798857, + 0.2965637526409565, + 0.2866292192818315, + 0.30432888055487695, + 0.29756708051203545, + 0.3141251911435577, + 0.3177041467358545, + 0.31360059194785106, + 0.3063605061708683 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.v2.json 
b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.v2.json index 6a2a9a6058..845b8856d0 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/BiorxivClusteringS2S.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", - "evaluation_time": 3.969054698944092, + "evaluation_time": 5.476711988449097, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 0.3339370426981849, - "v_measure": 0.3339370426981849, + "main_score": 0.32227564209897747, + "v_measure": 0.32227564209897747, + "v_measure_std": 0.009992728684163581, "v_measures": { "Level 0": [ - 0.3302061666870833, - 0.3281281937981429, - 0.3247804236909797, - 0.328161210623474, - 0.3447496976066929, - 0.3265987750170304, - 0.3537641508943676, - 0.3291396991260163, - 0.34049174690560796, - 0.333350362632454 + 0.3102017449685675, + 0.30833918488785594, + 0.32129054462162604, + 0.3378411872623731, + 0.3309189139523531, + 0.31444430751870256, + 0.31134026990061114, + 0.32809804896382716, + 0.33115005216890725, + 0.32913216674495016 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..f3a5421752 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 440.3515968322754, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", 
+ "languages": [ + "eng-Latn" + ], + "main_score": 0.3059857191163335, + "v_measure": 0.3059857191163335, + "v_measure_std": 0.012997533528741575, + "v_measures": [ + 0.30581603045947914, + 0.292543051114527, + 0.2920950295962386, + 0.28928610220817924, + 0.2981607931447702, + 0.309293422480486, + 0.3200625261927456, + 0.33311435679255, + 0.3086768856802283, + 0.31080899349413055 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.v2.json index 97a2c9fd0e..a4d7a922e1 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringP2P.v2.json @@ -1,8 +1,8 @@ { - "dataset_revision": "9894e30672c61db02f10a8593519d84e2b7a1a1c", - "evaluation_time": 25.459837913513184, + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 20.822232961654663, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 0.3451514118693984, - "v_measure": 0.3451514118693984, + "main_score": 0.3438593334716001, + "v_measure": 0.3438593334716001, + "v_measure_std": 0.009797227512717147, "v_measures": { "Level 0": [ - 0.3350660058115947, - 0.3463088014650183, - 0.36955511878974534, - 0.3364081769617164, - 0.3391988138188023, - 0.3623025442569412, - 0.3348984057814975, - 0.3377475214308677, - 0.3646608855802199, - 0.3253678447975809 + 0.3552367044880743, + 0.34417062384346003, + 0.34561687946145303, + 0.3331156937504119, + 0.323658973833394, + 0.3564774656387454, + 0.35054809271663673, + 0.3404001083222112, + 0.3381093887704985, + 
0.35125940389111565 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..b4fa9f513f --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 40.70884728431702, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.28729247758093046, + "v_measure": 0.28729247758093046, + "v_measure_std": 0.012688958178104587, + "v_measures": [ + 0.27707842775026437, + 0.27389233936947205, + 0.2758802471031439, + 0.2734935746145515, + 0.27801490433431497, + 0.30198160905542243, + 0.2945325940704253, + 0.3010574408357491, + 0.3087619387587898, + 0.2882316999171712 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.v2.json index 19c299dfcf..22d69686b9 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/MedrxivClusteringS2S.v2.json @@ -1,8 +1,8 @@ { - "dataset_revision": "ec20c81676a749c0f06fb4a9397fc7e168521458", - "evaluation_time": 4.423388242721558, + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 5.617826700210571, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ 
"languages": [ "eng-Latn" ], - "main_score": 0.3317860603999151, - "v_measure": 0.3317860603999151, + "main_score": 0.3208302771703123, + "v_measure": 0.3208302771703123, + "v_measure_std": 0.00570709389236284, "v_measures": { "Level 0": [ - 0.3360525258957095, - 0.3245928773634347, - 0.33335253284457933, - 0.3249579530334003, - 0.3330799819970639, - 0.31834960163901105, - 0.32824526044140706, - 0.3379051909660825, - 0.35300373848206046, - 0.32832094133640183 + 0.3205857958813099, + 0.3129654084776898, + 0.3204078853183542, + 0.3233631713646348, + 0.32175264346539295, + 0.3243699737043447, + 0.3200438946729818, + 0.3266348380922192, + 0.32917540510925697, + 0.3090037556169383 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.json new file mode 100644 index 0000000000..d00b73bb09 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 333.2109739780426, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4315016803356789, + "v_measure": 0.4315016803356789, + "v_measure_std": 0.050046769105753355, + "v_measures": [ + 0.3899135788336536, + 0.5222611855652423, + 0.4000214183807749, + 0.41669890655780106, + 0.4350556771316963, + 0.43546212061602335, + 0.4704746876298788, + 0.37845532083531574, + 0.3986206963164758, + 0.3968334546709837, + 0.4214596817687342, + 0.5068502845662192, + 0.3973528487984853, + 0.4512344962141797, + 0.5125666672366576, + 0.38427016639848643, + 0.43924342920164716, + 0.5078631117279251, + 0.42861193894654226, + 0.3948749829862104, + 0.3757822633989318, + 0.3952698829310342, + 0.5449360560026447, + 
0.41371502319555176, + 0.36971412848087937 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.v2.json new file mode 100644 index 0000000000..e7550233dd --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 28.79456114768982, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3795780973778102, + "v_measure": 0.3795780973778102, + "v_measure_std": 0.01375930110633421, + "v_measures": { + "Level 0": [ + 0.393899771090546, + 0.3776586353358133, + 0.3923447800262125, + 0.3743311654229293, + 0.3676471836497551, + 0.3610821313777014, + 0.36813952569397274, + 0.37720444526280533, + 0.40872616812460166, + 0.3747471677937645 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.json new file mode 100644 index 0000000000..be4bd85d22 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 2453.8660345077515, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6169121989934536, + "v_measure": 0.6169121989934536, 
+ "v_measure_std": 0.11030125277753228, + "v_measures": [ + 0.6553078084743721, + 0.656397577043616, + 0.6638586266282993, + 0.38674081198065285, + 0.6992092144039028, + 0.6048964807128823, + 0.4204187925018359, + 0.6896299252821184, + 0.6993311288855372, + 0.6933316240213201 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.v2.json index c52fed66e3..00eee52c1f 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringP2P.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", - "evaluation_time": 90.81473398208618, + "evaluation_time": 108.42505097389221, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 0.6322187313666577, - "v_measure": 0.6322187313666577, + "main_score": 0.5892478675267292, + "v_measure": 0.5892478675267292, + "v_measure_std": 0.00790178249532879, "v_measures": { "Level 0": [ - 0.6309276538148396, - 0.6187034042508489, - 0.6237643579419107, - 0.6193449830466853, - 0.6452689787697535, - 0.6385791102691598, - 0.6542826933879669, - 0.6302256968225023, - 0.6344905620654006, - 0.6265998732975097 + 0.5904887104518106, + 0.5914686741944213, + 0.5793461388791847, + 0.5711346175951495, + 0.5879419156323403, + 0.5961329479768771, + 0.5936851842566048, + 0.5944369026140076, + 0.5888051965583738, + 0.599038387108521 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringS2S.v2.json 
b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringS2S.v2.json deleted file mode 100644 index d585628da1..0000000000 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/RedditClusteringS2S.v2.json +++ /dev/null @@ -1,33 +0,0 @@ -{ - "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", - "evaluation_time": 13.900465726852417, - "kg_co2_emissions": null, - "mteb_version": "1.8.3", - "scores": { - "test": [ - { - "hf_subset": "default", - "languages": [ - "eng-Latn" - ], - "main_score": 0.39510169078059737, - "v_measure": 0.39510169078059737, - "v_measures": { - "Level 0": [ - 0.41325622684946195, - 0.3810173457972112, - 0.3875515027417737, - 0.3774330996615185, - 0.42543570466284153, - 0.39395796510384407, - 0.41382099670517764, - 0.385113100173911, - 0.3740271503958871, - 0.39940381571434685 - ] - } - } - ] - }, - "task_name": "RedditClusteringS2S.v2" -} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.json new file mode 100644 index 0000000000..e340e03bd9 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 243.16987895965576, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5530618688738845, + "v_measure": 0.5530618688738845, + "v_measure_std": 0.05210089468183967, + "v_measures": [ + 0.5506182631851375, + 0.6098472794008257, + 0.44884905130888936, + 0.5516385405128469, + 0.5194284248733142, + 0.4914320610158897, + 0.5029636446257895, + 0.6068214257212708, + 
0.5511591838426464, + 0.5625517095297468, + 0.6248970053480281, + 0.6152856080318063, + 0.7018985364271394, + 0.5914797519615147, + 0.5229708722434635, + 0.5475301598702013, + 0.528510437313286, + 0.538358895793387, + 0.5217772773576943, + 0.5409771373530979, + 0.5812137020536748, + 0.48807763749190974, + 0.5173798706624534, + 0.5828855479501713, + 0.527994697972928 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.v2.json index 1ef85b49b6..65d550f8f1 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClustering.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", - "evaluation_time": 13.482004642486572, + "evaluation_time": 26.358269691467285, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 0.4703427318380077, - "v_measure": 0.4703427318380077, + "main_score": 0.4488357488649742, + "v_measure": 0.4488357488649742, + "v_measure_std": 0.004838030659190088, "v_measures": { "Level 0": [ - 0.47540436840034184, - 0.48130248468146364, - 0.4515014951676904, - 0.4523062801357879, - 0.4774471097128135, - 0.47161530151282127, - 0.48470733199065164, - 0.45767313869338483, - 0.460773830163638, - 0.4906959779214842 + 0.4475366915829305, + 0.4420953447790183, + 0.44937842894282226, + 0.4502850848233301, + 0.4534784816548607, + 0.44715157752051804, + 0.4599109889840537, + 0.4437921353520995, + 0.4453984828047111, + 0.4493302722053972 ] } } diff --git 
a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..d239cfbee9 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 576.6836857795715, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33514810885686347, + "v_measure": 0.33514810885686347, + "v_measure_std": 0.011921231043784609, + "v_measures": [ + 0.32496891088801366, + 0.32305740541637007, + 0.3295693910461244, + 0.32265447677868436, + 0.32306155240574636, + 0.3578432648851771, + 0.3473428653812899, + 0.3447150355631154, + 0.3441825637619173, + 0.33408562244219664 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.v2.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.v2.json index 1dc5d91b58..4ce58afc6a 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/StackExchangeClusteringP2P.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", - "evaluation_time": 130.416344165802, + "evaluation_time": 29.734455108642578, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 
0.44354949364963064, - "v_measure": 0.44354949364963064, + "main_score": 0.391233099747441, + "v_measure": 0.391233099747441, + "v_measure_std": 0.005454439593422022, "v_measures": { "Level 0": [ - 0.4412825423562223, - 0.44095927415529707, - 0.43835596747998645, - 0.4358974616050223, - 0.4323619768898551, - 0.45427938940056944, - 0.4461413878298764, - 0.4547683270327954, - 0.43860241558357094, - 0.45284619416311084 + 0.38590662311946533, + 0.383588616193751, + 0.3958720998307544, + 0.3948893794244771, + 0.3885266458761183, + 0.3988845332880307, + 0.3996739462462243, + 0.39110239184627876, + 0.3879111744581548, + 0.385975587191156 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..efdfaaddef --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 31.626814126968384, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35549107308649774, + "v_measure": 0.35549107308649774, + "v_measure_std": 0.019272059566643098, + "v_measures": [ + 0.366697342712263, + 0.3247801821787894, + 0.35569877719138465, + 0.3791207085404633, + 0.3612360580168597, + 0.37231432973232126, + 0.3741259392637825, + 0.32304831890336566, + 0.3369977997463862, + 0.36089127457936215 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.v2.json 
b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.v2.json index d7591e48a4..8476f5ad6f 100644 --- a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.v2.json +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/TwentyNewsgroupsClustering.v2.json @@ -1,8 +1,8 @@ { "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", - "evaluation_time": 3.0396666526794434, + "evaluation_time": 4.351445913314819, "kg_co2_emissions": null, - "mteb_version": "1.8.3", + "mteb_version": "1.12.22", "scores": { "test": [ { @@ -10,20 +10,21 @@ "languages": [ "eng-Latn" ], - "main_score": 0.34945949012173144, - "v_measure": 0.34945949012173144, + "main_score": 0.3440775150414054, + "v_measure": 0.3440775150414054, + "v_measure_std": 0.020291006911712595, "v_measures": { "Level 0": [ - 0.3149729799214405, - 0.39740220557727307, - 0.321103238598569, - 0.3353245105400759, - 0.35602311589488445, - 0.3302274999942934, - 0.33523235040802457, - 0.3551810193958485, - 0.36378633311819675, - 0.38534164776870783 + 0.31873449377081414, + 0.36768680080742905, + 0.3343389313246565, + 0.3194104974430423, + 0.3790064831328666, + 0.3270114612789705, + 0.35984625372694173, + 0.34240713852426274, + 0.361046504358655, + 0.3312865860464154 ] } } diff --git a/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/model_meta.json b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/model_meta.json new file mode 100644 index 0000000000..74c0cc6818 --- /dev/null +++ b/results/intfloat__multilingual-e5-base/d13f1b27baf31030b7fd040960d60d909913633f/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/multilingual-e5-base", "revision": "d13f1b27baf31030b7fd040960d60d909913633f", "release_date": "2024-02-08", "languages": ["afr_Latn", "amh_Latn", "ara_Latn", "asm_Latn", "aze_Latn", "bel_Latn", "bul_Latn", 
"ben_Latn", "ben_Beng", "bre_Latn", "bos_Latn", "cat_Latn", "ces_Latn", "cym_Latn", "dan_Latn", "deu_Latn", "ell_Latn", "eng_Latn", "epo_Latn", "spa_Latn", "est_Latn", "eus_Latn", "fas_Latn", "fin_Latn", "fra_Latn", "fry_Latn", "gle_Latn", "gla_Latn", "glg_Latn", "guj_Latn", "hau_Latn", "heb_Latn", "hin_Latn", "hin_Deva", "hrv_Latn", "hun_Latn", "hye_Latn", "ind_Latn", "isl_Latn", "ita_Latn", "jpn_Latn", "jav_Latn", "kat_Latn", "kaz_Latn", "khm_Latn", "kan_Latn", "kor_Latn", "kur_Latn", "kir_Latn", "lat_Latn", "lao_Latn", "lit_Latn", "lav_Latn", "mlg_Latn", "mkd_Latn", "mal_Latn", "mon_Latn", "mar_Latn", "msa_Latn", "mya_Latn", "nep_Latn", "nld_Latn", "nob_Latn", "orm_Latn", "ori_Latn", "pan_Latn", "pol_Latn", "pus_Latn", "por_Latn", "ron_Latn", "rus_Latn", "san_Latn", "snd_Latn", "sin_Latn", "slk_Latn", "slv_Latn", "som_Latn", "sqi_Latn", "srp_Latn", "sun_Latn", "swe_Latn", "swa_Latn", "tam_Latn", "tam_Taml", "tel_Latn", "tel_Telu", "tha_Latn", "tgl_Latn", "tur_Latn", "uig_Latn", "ukr_Latn", "urd_Latn", "urd_Arab", "uzb_Latn", "vie_Latn", "xho_Latn", "yid_Latn", "zho_Hant", "zho_Hans"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..06bbd15f65 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 2588.5654129981995, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 
0.3550357435571952, + "v_measure": 0.3550357435571952, + "v_measure_std": 0.00975677085642146, + "v_measures": [ + 0.3574848861415261, + 0.35854807574868586, + 0.3421775854055586, + 0.3355525069038631, + 0.3468659476502996, + 0.3620779576653161, + 0.35731676404709883, + 0.35875465100753573, + 0.3624711937179693, + 0.3691078672840989 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..a907e34591 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 75.71730923652649, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.37782864895025936, + "v_measure": 0.37782864895025936, + "v_measure_std": 0.005401276710455373, + "v_measures": { + "Level 0": [ + 0.3706146024521105, + 0.3764543877048404, + 0.37451805756624523, + 0.3722572751752651, + 0.38032886093273804, + 0.3833484934218802, + 0.3841073477239218, + 0.37855004633517014, + 0.38667417033405027, + 0.3714332478563719 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..f2710d09c4 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ 
+ "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 220.60643410682678, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33296302380437415, + "v_measure": 0.33296302380437415, + "v_measure_std": 0.007033722094574496, + "v_measures": [ + 0.32517245629328445, + 0.33881752211948307, + 0.33895813652323065, + 0.3283098626230251, + 0.3200766766036506, + 0.33362056459694117, + 0.34261039867643844, + 0.33852480276919256, + 0.32682883062732365, + 0.33671098721117165 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..74bb4cc46f --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 10.2559654712677, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.361711408639092, + "v_measure": 0.361711408639092, + "v_measure_std": 0.012015292550621138, + "v_measures": { + "Level 0": [ + 0.3592180079187936, + 0.37203646196182355, + 0.355525747467753, + 0.36777715348003986, + 0.3508203562069542, + 0.3863097956194116, + 0.3700217369125274, + 0.3613900394364385, + 0.34310121252946935, + 0.35091357485770935 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.json 
b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..9b0ecb0dd9 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 1368.5693545341492, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3170461503468875, + "v_measure": 0.3170461503468875, + "v_measure_std": 0.01211263294931151, + "v_measures": [ + 0.3064000471314256, + 0.30906325283716407, + 0.31114858621179653, + 0.29847275182949756, + 0.308878435539186, + 0.33680662732989325, + 0.3185428112025414, + 0.3355932929749976, + 0.31823852352269444, + 0.32731717488967876 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..be97804adb --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 56.80961084365845, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.34888474080490084, + "v_measure": 0.34888474080490084, + "v_measure_std": 0.0058159366542501895, + "v_measures": { + "Level 0": [ + 0.3458707072097676, + 0.3467953776493341, + 0.35274835859496234, + 0.3448740933319091, + 0.34671778775915285, + 0.355968257300468, + 0.3535356605292112, + 
0.35920599622206234, + 0.3402207485562152, + 0.34291042089592505 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..5b1ead4664 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 124.09738898277283, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2975568632212487, + "v_measure": 0.2975568632212487, + "v_measure_std": 0.011451355732813825, + "v_measures": [ + 0.2943106254697954, + 0.28028416337977696, + 0.2875879134065354, + 0.29616601628713085, + 0.2834121052216028, + 0.30215106521956636, + 0.3094788174999991, + 0.3195817329031507, + 0.30481480264544325, + 0.2977813901794862 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..83e4934066 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 8.830669164657593, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 
0.3300850381198015, + "v_measure": 0.3300850381198015, + "v_measure_std": 0.007028730159397851, + "v_measures": { + "Level 0": [ + 0.32585677549961156, + 0.32431154055626255, + 0.3419815026473494, + 0.31877258486426274, + 0.32965864944073914, + 0.32303554618038627, + 0.32822365699648, + 0.3376249238334836, + 0.3353460051183, + 0.33603919606113974 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.json new file mode 100644 index 0000000000..2a3a101af9 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 1038.227093219757, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4690683227522037, + "v_measure": 0.4690683227522037, + "v_measure_std": 0.06311426976967667, + "v_measures": [ + 0.5480269333378893, + 0.4983641774142771, + 0.40428009229498907, + 0.4572569102977324, + 0.5016433521339552, + 0.4200969919045957, + 0.4874222428435611, + 0.424774792761486, + 0.4271797683501383, + 0.40745929515934043, + 0.45283217551666843, + 0.5183701127997492, + 0.4417487747102521, + 0.4659079559947688, + 0.6310998875955774, + 0.4241757302028172, + 0.4936740621416464, + 0.6047135837401434, + 0.456872630260866, + 0.4002594273625891, + 0.37796926993435404, + 0.4154221455363117, + 0.5618674876148675, + 0.47398007910060497, + 0.4313101897959134 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.v2.json 
b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.v2.json new file mode 100644 index 0000000000..e54639ad81 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 83.57516241073608, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.41578010505305374, + "v_measure": 0.41578010505305374, + "v_measure_std": 0.01215897871457087, + "v_measures": { + "Level 0": [ + 0.40609256621983136, + 0.39769870353242887, + 0.42107018464152, + 0.4242338675060048, + 0.4322920909894932, + 0.43372688770959883, + 0.39693265711314124, + 0.41743765471657024, + 0.4138391405913953, + 0.41447729751055346 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.json new file mode 100644 index 0000000000..56778e64db --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 7784.600197315216, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6300255425042132, + "v_measure": 0.6300255425042132, + "v_measure_std": 0.11846723815443064, + "v_measures": [ + 0.6708994312637823, + 0.6790276241355099, + 0.6710702718023583, + 0.3953919744201308, + 0.7190138192613187, + 0.6410702160746005, + 0.4012988656653108, + 0.7034210064717134, + 
0.6855576812960705, + 0.7335045346513356 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..13cce8cad5 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 330.6445038318634, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6129823486986854, + "v_measure": 0.6129823486986854, + "v_measure_std": 0.006553177656735589, + "v_measures": { + "Level 0": [ + 0.6161200861520895, + 0.6286568173770195, + 0.6048002559011295, + 0.6071668305833974, + 0.608487965923218, + 0.6147721797574445, + 0.6111306032843626, + 0.612956401131941, + 0.6080557412150089, + 0.6176766056612446 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.json new file mode 100644 index 0000000000..e3708ea181 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 762.5493402481079, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5837312129318919, + 
"v_measure": 0.5837312129318919, + "v_measure_std": 0.05049774654708862, + "v_measures": [ + 0.6295997789610954, + 0.6283153032775785, + 0.5093546397212798, + 0.5799467525525586, + 0.5390360305126893, + 0.5349524240915096, + 0.5202410268896647, + 0.6656177534416677, + 0.5951424997183259, + 0.6079780427410808, + 0.6488748469360486, + 0.699905303943518, + 0.680762948936147, + 0.598563961159552, + 0.5598941308286685, + 0.5554098194379443, + 0.5646274661493497, + 0.5565892090916954, + 0.556013393724937, + 0.5663514278951832, + 0.5830354323824856, + 0.5295394730230879, + 0.523939052972823, + 0.600046291358453, + 0.559543313549954 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..50da2c940b --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 72.70891284942627, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4594824005760283, + "v_measure": 0.4594824005760283, + "v_measure_std": 0.009665162994694535, + "v_measures": { + "Level 0": [ + 0.46952084278432876, + 0.46987520339226546, + 0.4591929971587815, + 0.46825539261683546, + 0.44798989438976744, + 0.4458871930537055, + 0.4731636474797577, + 0.4517722947603411, + 0.45029425111968646, + 0.45887228900481314 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git 
a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..e2ba54a9d5 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 1832.2122027873993, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3290068489971592, + "v_measure": 0.3290068489971592, + "v_measure_std": 0.014535106075796889, + "v_measures": [ + 0.31665505763991364, + 0.30858738781189965, + 0.31892453779711055, + 0.32304411699294766, + 0.3170551048124535, + 0.3599653114910528, + 0.32884229365653983, + 0.33928992994585283, + 0.3372623140557331, + 0.3404424357680881 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..e4d794e776 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 81.38813066482544, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3871452341367957, + "v_measure": 0.3871452341367957, + "v_measure_std": 0.007834837417058425, + "v_measures": { + "Level 0": [ + 
0.3687428518980269, + 0.3934617774029864, + 0.3902567130128312, + 0.38125813198768144, + 0.38470413817451427, + 0.3871770372623639, + 0.3825086655265749, + 0.39418606795028527, + 0.39327008707720784, + 0.3958868710754848 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..9214ba46dd --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 90.8305401802063, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.39396391218501564, + "v_measure": 0.39396391218501564, + "v_measure_std": 0.027380648967402766, + "v_measures": [ + 0.40899048036098523, + 0.3950918770166858, + 0.3834541828265394, + 0.39071413466448374, + 0.39864100309472916, + 0.45204858802359116, + 0.4175530404739191, + 0.38164193514955097, + 0.3478582273853781, + 0.36364565285429373 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.v2.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..0230076184 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + 
"evaluation_time": 6.9396812915802, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3859549710223528, + "v_measure": 0.3859549710223528, + "v_measure_std": 0.016970708035846535, + "v_measures": { + "Level 0": [ + 0.398991469739776, + 0.37443259709887444, + 0.39262879727773525, + 0.3836129936905975, + 0.42485638947094584, + 0.3865701163848389, + 0.38353698132612546, + 0.3866477075021634, + 0.35888383004073743, + 0.3693888276917341 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/model_meta.json b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/model_meta.json new file mode 100644 index 0000000000..fc851b23d4 --- /dev/null +++ b/results/intfloat__multilingual-e5-large/4dc6d853a804b9c8886ede6dda8a073b7dc08a81/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/multilingual-e5-large", "revision": "4dc6d853a804b9c8886ede6dda8a073b7dc08a81", "release_date": "2024-02-08", "languages": ["afr_Latn", "amh_Latn", "ara_Latn", "asm_Latn", "aze_Latn", "bel_Latn", "bul_Latn", "ben_Latn", "ben_Beng", "bre_Latn", "bos_Latn", "cat_Latn", "ces_Latn", "cym_Latn", "dan_Latn", "deu_Latn", "ell_Latn", "eng_Latn", "epo_Latn", "spa_Latn", "est_Latn", "eus_Latn", "fas_Latn", "fin_Latn", "fra_Latn", "fry_Latn", "gle_Latn", "gla_Latn", "glg_Latn", "guj_Latn", "hau_Latn", "heb_Latn", "hin_Latn", "hin_Deva", "hrv_Latn", "hun_Latn", "hye_Latn", "ind_Latn", "isl_Latn", "ita_Latn", "jpn_Latn", "jav_Latn", "kat_Latn", "kaz_Latn", "khm_Latn", "kan_Latn", "kor_Latn", "kur_Latn", "kir_Latn", "lat_Latn", "lao_Latn", "lit_Latn", "lav_Latn", "mlg_Latn", "mkd_Latn", "mal_Latn", "mon_Latn", "mar_Latn", "msa_Latn", "mya_Latn", "nep_Latn", "nld_Latn", "nob_Latn", "orm_Latn", "ori_Latn", "pan_Latn", "pol_Latn", 
"pus_Latn", "por_Latn", "ron_Latn", "rus_Latn", "san_Latn", "snd_Latn", "sin_Latn", "slk_Latn", "slv_Latn", "som_Latn", "sqi_Latn", "srp_Latn", "sun_Latn", "swe_Latn", "swa_Latn", "tam_Latn", "tam_Taml", "tel_Latn", "tel_Telu", "tha_Latn", "tgl_Latn", "tur_Latn", "uig_Latn", "ukr_Latn", "urd_Latn", "urd_Arab", "uzb_Latn", "vie_Latn", "xho_Latn", "yid_Latn", "zho_Hant", "zho_Hans"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..4366ddc88a --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 373.4567942619324, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35840067155026445, + "v_measure": 0.35840067155026445, + "v_measure_std": 0.011300755643698134, + "v_measures": [ + 0.37703912185534694, + 0.3673236583371325, + 0.36030838134496246, + 0.35414715597428426, + 0.346589019265193, + 0.34288816486682117, + 0.35564802450672894, + 0.376980567794252, + 0.35234232355148476, + 0.35074029800643797 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..a0e845a819 --- /dev/null +++ 
b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 13.810868978500366, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3738270289843687, + "v_measure": 0.3738270289843687, + "v_measure_std": 0.00793531540293255, + "v_measures": { + "Level 0": [ + 0.3745086321210854, + 0.37561123888027487, + 0.36377712323804773, + 0.3796471337821347, + 0.37599322294105303, + 0.38473160317367633, + 0.3580601842171862, + 0.383215120635189, + 0.3744204304634002, + 0.36830560039163995 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..70a2af0ad4 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 30.032146453857422, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2734880263329374, + "v_measure": 0.2734880263329374, + "v_measure_std": 0.007532488581889927, + "v_measures": [ + 0.27585463366760715, + 0.264396763158794, + 0.2774073534668043, + 0.26264506641736296, + 0.27213376615230245, + 0.2825130077828003, + 0.26485325125552744, + 0.28104465637608445, + 0.2843084538619933, + 0.2697233111900977 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git 
a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..022eaa6002 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 4.051107883453369, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.28862328809555005, + "v_measure": 0.28862328809555005, + "v_measure_std": 0.010630546329771028, + "v_measures": { + "Level 0": [ + 0.2920232889998999, + 0.2984654062105169, + 0.29769851350421395, + 0.27812242142541654, + 0.28236388974269133, + 0.29753816676907235, + 0.295810767286731, + 0.29475498138875056, + 0.2638892768401008, + 0.28556616878810714 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..b10fd84215 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 205.5523705482483, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.30722540604458687, + "v_measure": 0.30722540604458687, + "v_measure_std": 0.014588652154123818, + "v_measures": [ + 0.29967000310421416, + 0.2850330881134532, 
+ 0.28837123576483065, + 0.3033341846788103, + 0.30280308172969833, + 0.3172055177847937, + 0.31135906713827854, + 0.33486588979367504, + 0.3246271344801741, + 0.30498485785794066 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..4d86202e95 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 10.985667705535889, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3384026113550393, + "v_measure": 0.3384026113550393, + "v_measure_std": 0.00890536645810488, + "v_measures": { + "Level 0": [ + 0.35437244468613255, + 0.33013256937599755, + 0.3343315021102052, + 0.33237504869781614, + 0.3249842694921395, + 0.3495327602720878, + 0.335776566367746, + 0.3345780329623614, + 0.3477951447454561, + 0.3401477748404507 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..beb9caf110 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 17.568665027618408, + "kg_co2_emissions": null, + "mteb_version": 
"1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.26996988111535514, + "v_measure": 0.26996988111535514, + "v_measure_std": 0.0119414541402319, + "v_measures": [ + 0.2594862944173476, + 0.26021154851901757, + 0.26181699391386687, + 0.2503715924553382, + 0.26100221510595145, + 0.28272454647012957, + 0.2760414572428568, + 0.2841464491253968, + 0.2808628612726323, + 0.28303485263101386 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..5eaafb5cf0 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 3.8231515884399414, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31796932981915316, + "v_measure": 0.31796932981915316, + "v_measure_std": 0.00870567446846545, + "v_measures": { + "Level 0": [ + 0.2998698818319255, + 0.3092255725042243, + 0.3177205705203365, + 0.3235577478548142, + 0.328687753583177, + 0.3146211043932908, + 0.31111725390057726, + 0.3254084493450746, + 0.3258411684185387, + 0.32364379583957287 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.json new file mode 100644 index 0000000000..85fd508385 --- /dev/null +++ 
b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 143.39311242103577, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4011555396409509, + "v_measure": 0.4011555396409509, + "v_measure_std": 0.06532973117942373, + "v_measures": [ + 0.43924415547815493, + 0.4648204019496003, + 0.3634670245059431, + 0.34996271631961057, + 0.3755802403823603, + 0.36625814922396, + 0.39978514515292285, + 0.35586798358803196, + 0.33131383396695796, + 0.37495760001729866, + 0.3779173495615085, + 0.49280279451125475, + 0.39631239594264267, + 0.41286392832069285, + 0.5727645148361832, + 0.34535579003657113, + 0.4344376870664589, + 0.5522002199174861, + 0.3605330364708775, + 0.35072864937515813, + 0.31824360817273484, + 0.3617872826280434, + 0.4803591464281226, + 0.40640128709706164, + 0.34492355007413544 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.v2.json new file mode 100644 index 0000000000..17264e9b43 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 13.848104000091553, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.34014974750909766, + "v_measure": 0.34014974750909766, + "v_measure_std": 0.007528777352876526, + "v_measures": { + "Level 0": [ + 0.3267997569761271, 
+ 0.3346454173605815, + 0.33475558021845914, + 0.33308222562091033, + 0.34599684483160403, + 0.3398782875589474, + 0.3410782283463533, + 0.34647424965132984, + 0.3534703683874866, + 0.34531651613917763 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.json new file mode 100644 index 0000000000..3fd521f457 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 1067.6302752494812, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5949355777379512, + "v_measure": 0.5949355777379512, + "v_measure_std": 0.1201949717543935, + "v_measures": [ + 0.6400556284396514, + 0.6451079234762306, + 0.6453039470979828, + 0.38070266991858365, + 0.6742530388521604, + 0.5958766416873841, + 0.34071630971253514, + 0.6688777000369198, + 0.6582062579138896, + 0.7002556602441763 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..faba535f37 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 49.83731269836426, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + 
"scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5689204529010279, + "v_measure": 0.5689204529010279, + "v_measure_std": 0.006875726831712545, + "v_measures": { + "Level 0": [ + 0.5674536948994331, + 0.5750045361791122, + 0.5582313174518326, + 0.5714581198675189, + 0.5617327732376419, + 0.568007208559642, + 0.5606027557590141, + 0.578659108896322, + 0.5787288425660168, + 0.5693261715937451 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.json new file mode 100644 index 0000000000..0fd01947d4 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 112.3986005783081, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.533157712339661, + "v_measure": 0.533157712339661, + "v_measure_std": 0.05881134497723907, + "v_measures": [ + 0.5149556026506005, + 0.5741545702686627, + 0.4469995562276755, + 0.5678006543665266, + 0.4795679317121149, + 0.5022047071386572, + 0.45589623369775, + 0.5537312345148071, + 0.5253922380464688, + 0.5416090263799735, + 0.7025820670938749, + 0.6087271458345636, + 0.6543947895366301, + 0.5845274688607025, + 0.5143120405618706, + 0.5246145874584811, + 0.5048436197861124, + 0.5132818015677498, + 0.4943860431578122, + 0.5039302350689131, + 0.5678584103975669, + 0.4647173198070034, + 0.4738303077323309, + 0.5388959950955831, + 0.5157292215290958 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff 
--git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..960e3e9381 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 13.450961351394653, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.43652678448376847, + "v_measure": 0.43652678448376847, + "v_measure_std": 0.014149799933808186, + "v_measures": { + "Level 0": [ + 0.44775353790989714, + 0.455171778791717, + 0.44289019637752913, + 0.4397277232940181, + 0.43570152533163947, + 0.4349189465572853, + 0.44108769754080585, + 0.40143386784784624, + 0.4433221312383573, + 0.423260439948589 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..11468ffd2a --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 262.87545895576477, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3186981585334296, + "v_measure": 0.3186981585334296, + "v_measure_std": 0.01179815056338052, + "v_measures": [ + 
0.3104513218943992, + 0.31135684126285157, + 0.3039045169872521, + 0.30526753516320304, + 0.30704674355490064, + 0.33406890061086314, + 0.3267613164859199, + 0.336680541252623, + 0.32814703264342143, + 0.32329683547886234 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..c7ce705f7a --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 15.542395830154419, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.37538281657760325, + "v_measure": 0.37538281657760325, + "v_measure_std": 0.00631255183685697, + "v_measures": { + "Level 0": [ + 0.3763564787588726, + 0.36765788247068193, + 0.37088588255107185, + 0.37887421781176844, + 0.3743385786327181, + 0.37980136169483214, + 0.37771220275871853, + 0.3840096426144594, + 0.38167142737956133, + 0.36252049110334833 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..a0f3129e47 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": 
"6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 16.9054114818573, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3367465525011798, + "v_measure": 0.3367465525011798, + "v_measure_std": 0.02030592426159109, + "v_measures": [ + 0.331427808172204, + 0.3498562516396635, + 0.355293705851231, + 0.3475249777317855, + 0.28591250510981736, + 0.3330056569745029, + 0.33807270518930627, + 0.3608033964040712, + 0.34403140010601063, + 0.3215371178332055 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.v2.json b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..789d54022a --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 3.2124361991882324, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3393812319511116, + "v_measure": 0.3393812319511116, + "v_measure_std": 0.020116338694840856, + "v_measures": { + "Level 0": [ + 0.3274518376622219, + 0.34364107490710766, + 0.34733693851046116, + 0.37369989588781444, + 0.3286569879352603, + 0.3014423670066226, + 0.34536830241280353, + 0.32703014184991974, + 0.3682183560366374, + 0.33096641730226684 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/model_meta.json 
b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/model_meta.json new file mode 100644 index 0000000000..f02ab56fc5 --- /dev/null +++ b/results/intfloat__multilingual-e5-small/e4ce9877abf3edfe10b0d82785e83bdcb973e22e/model_meta.json @@ -0,0 +1 @@ +{"name": "intfloat/multilingual-e5-small", "revision": "e4ce9877abf3edfe10b0d82785e83bdcb973e22e", "release_date": "2024-02-08", "languages": ["afr_Latn", "amh_Latn", "ara_Latn", "asm_Latn", "aze_Latn", "bel_Latn", "bul_Latn", "ben_Latn", "ben_Beng", "bre_Latn", "bos_Latn", "cat_Latn", "ces_Latn", "cym_Latn", "dan_Latn", "deu_Latn", "ell_Latn", "eng_Latn", "epo_Latn", "spa_Latn", "est_Latn", "eus_Latn", "fas_Latn", "fin_Latn", "fra_Latn", "fry_Latn", "gle_Latn", "gla_Latn", "glg_Latn", "guj_Latn", "hau_Latn", "heb_Latn", "hin_Latn", "hin_Deva", "hrv_Latn", "hun_Latn", "hye_Latn", "ind_Latn", "isl_Latn", "ita_Latn", "jpn_Latn", "jav_Latn", "kat_Latn", "kaz_Latn", "khm_Latn", "kan_Latn", "kor_Latn", "kur_Latn", "kir_Latn", "lat_Latn", "lao_Latn", "lit_Latn", "lav_Latn", "mlg_Latn", "mkd_Latn", "mal_Latn", "mon_Latn", "mar_Latn", "msa_Latn", "mya_Latn", "nep_Latn", "nld_Latn", "nob_Latn", "orm_Latn", "ori_Latn", "pan_Latn", "pol_Latn", "pus_Latn", "por_Latn", "ron_Latn", "rus_Latn", "san_Latn", "snd_Latn", "sin_Latn", "slk_Latn", "slv_Latn", "som_Latn", "sqi_Latn", "srp_Latn", "sun_Latn", "swe_Latn", "swa_Latn", "tam_Latn", "tam_Taml", "tel_Latn", "tel_Telu", "tha_Latn", "tgl_Latn", "tur_Latn", "uig_Latn", "ukr_Latn", "urd_Latn", "urd_Arab", "uzb_Latn", "vie_Latn", "xho_Latn", "yid_Latn", "zho_Hant", "zho_Hans"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "E5Wrapper"} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.json 
b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..65ecaef72f --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 2453.920761823654, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4035489115547205, + "v_measure": 0.4035489115547205, + "v_measure_std": 0.013344732627977219, + "v_measures": [ + 0.39155763576440866, + 0.391778158785331, + 0.40381362022257206, + 0.3808596153381086, + 0.3922439568389595, + 0.4060505517951984, + 0.41538014808018703, + 0.4216650336690922, + 0.41024757389916766, + 0.42189282115417975 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..c5c11915dd --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 72.90839457511902, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4187022064365139, + "v_measure": 0.4187022064365139, + "v_measure_std": 0.009724522380459165, + "v_measures": { + "Level 0": [ + 0.4050463078726262, + 0.423314158639693, + 0.4294480555829178, + 0.4236138861805959, + 0.4205368593703068, + 0.4237515095591415, + 
0.41529568456910054, + 0.41819647292063516, + 0.4299041172937787, + 0.39791501237634286 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..4cb66e6d39 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 190.13294434547424, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.36683148479894867, + "v_measure": 0.36683148479894867, + "v_measure_std": 0.01037265767335365, + "v_measures": [ + 0.364816385186632, + 0.3879806357656108, + 0.3554289501689786, + 0.3539339657758455, + 0.37111102710002974, + 0.36856941336895194, + 0.3667435301776565, + 0.3808693062854585, + 0.3597958202288718, + 0.35906581393145187 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..e12ed5848e --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 9.293036460876465, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + 
"eng-Latn" + ], + "main_score": 0.4001329292384076, + "v_measure": 0.4001329292384076, + "v_measure_std": 0.008126409315880075, + "v_measures": { + "Level 0": [ + 0.3935275983135327, + 0.3949789304615553, + 0.4077240814883973, + 0.39965328828360536, + 0.3859014409906691, + 0.4032977783899114, + 0.41564726256824186, + 0.3996189886013326, + 0.40675775192085317, + 0.39422217136597776 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..e5a900dc35 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 1350.4132771492004, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3317955166454995, + "v_measure": 0.3317955166454995, + "v_measure_std": 0.013552434074404698, + "v_measures": [ + 0.3203703653192594, + 0.3228535463207019, + 0.32120090353414227, + 0.31756803980451553, + 0.31828581501634207, + 0.3541646090149659, + 0.3443653583220722, + 0.34831340199961275, + 0.3446786125689817, + 0.3261545145544012 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..c0ea836cf7 --- /dev/null +++ 
b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 58.00021147727966, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.36656059517378203, + "v_measure": 0.36656059517378203, + "v_measure_std": 0.00828927231716789, + "v_measures": { + "Level 0": [ + 0.37018780341085833, + 0.3569680328932698, + 0.3627604353551965, + 0.36179251165973003, + 0.37122315475734796, + 0.36054803536441477, + 0.36540717978054493, + 0.3849840925354074, + 0.35734786060971746, + 0.3743868453713331 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..54866c88e8 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 105.49251294136047, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3141524627143847, + "v_measure": 0.3141524627143847, + "v_measure_std": 0.016210263185160487, + "v_measures": [ + 0.29965696563163347, + 0.30247924316343905, + 0.3001395475020178, + 0.3033801046213946, + 0.29612318605575966, + 0.33698746009814484, + 0.3433427529318742, + 0.3303934048355355, + 0.316292428046378, + 0.31272953425766914 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git 
a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..c9a069cf06 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 8.469618320465088, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3516571061876409, + "v_measure": 0.3516571061876409, + "v_measure_std": 0.009555061820861818, + "v_measures": { + "Level 0": [ + 0.3545343684779735, + 0.3353303623127802, + 0.35697666314165516, + 0.33216660899868033, + 0.3569018087583997, + 0.35840399674177176, + 0.3502664185208431, + 0.35630774905585527, + 0.35250819271705514, + 0.3631748931513943 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.json new file mode 100644 index 0000000000..a208d9ba34 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 1177.9379081726074, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5877539950912152, + "v_measure": 0.5877539950912152, + "v_measure_std": 0.04688180544372522, + "v_measures": [ + 0.5938450489115217, + 
0.6491643259861977, + 0.5208877728903546, + 0.5648881672018695, + 0.558786320030191, + 0.5642104725127111, + 0.6221069472499868, + 0.559159611392674, + 0.5653177907579733, + 0.5622123276776294, + 0.5421734935429708, + 0.5659360346263855, + 0.5861831125559152, + 0.6121044393840697, + 0.7046177766636607, + 0.5491433508103596, + 0.6127067965255044, + 0.6527287563781005, + 0.5695294184440446, + 0.5592058933030177, + 0.5385662747339949, + 0.5553329849659868, + 0.6960434030167377, + 0.6262942135811407, + 0.5627051441373787 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.v2.json new file mode 100644 index 0000000000..5a8bb74544 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 97.7238450050354, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5613695733020986, + "v_measure": 0.5613695733020986, + "v_measure_std": 0.010141984816188256, + "v_measures": { + "Level 0": [ + 0.5768648884850722, + 0.562778458286498, + 0.5779593789488652, + 0.5451581167172895, + 0.5521888277197725, + 0.5524077934762526, + 0.5571529265439831, + 0.5577418816188128, + 0.5684652178247105, + 0.5629782433997302 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.json new file mode 
100644 index 0000000000..36968a162f --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 7558.53716468811, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6475138413034877, + "v_measure": 0.6475138413034877, + "v_measure_std": 0.1266144454300707, + "v_measures": [ + 0.696195565013078, + 0.6854169139285026, + 0.6701935993922018, + 0.3989287791288467, + 0.7272842719648743, + 0.6431148800093455, + 0.40993584285454576, + 0.7597775530866567, + 0.7214416598449416, + 0.7628493478118838 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..0d50e114ed --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 322.99111819267273, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6582303143101478, + "v_measure": 0.6582303143101478, + "v_measure_std": 0.003940220883935089, + "v_measures": { + "Level 0": [ + 0.6577883239687152, + 0.6636324313844517, + 0.6546280224302481, + 0.6537490518168375, + 0.6627460019467355, + 0.6566953856186603, + 0.6607568298046633, + 0.6637964903012642, + 0.6535128429286692, + 0.6549977629012332 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ 
No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.json new file mode 100644 index 0000000000..bf97a85fda --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 909.9153478145599, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.6524256372565289, + "v_measure": 0.6524256372565289, + "v_measure_std": 0.04047467160184454, + "v_measures": [ + 0.712677772120035, + 0.6730581487051284, + 0.5702109060331013, + 0.6701450301098236, + 0.6668381926668918, + 0.6122491129344874, + 0.6297789157905174, + 0.7228341099693218, + 0.6655300264396213, + 0.6538806129718214, + 0.7317061446360874, + 0.6986297671890418, + 0.7049779522281712, + 0.6696928210098196, + 0.6066351476554503, + 0.6548449841063315, + 0.6313921055225882, + 0.6182259790345701, + 0.6335150803111455, + 0.6404073153637525, + 0.656988056369104, + 0.6072461833418159, + 0.585018216989664, + 0.6471914983299971, + 0.6469668515849322 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..743b4ec3e3 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": 
"6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 93.00119757652283, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.550802570899201, + "v_measure": 0.550802570899201, + "v_measure_std": 0.010730581816619057, + "v_measures": { + "Level 0": [ + 0.568494593940954, + 0.5582614299332992, + 0.551242267552277, + 0.5517510152895378, + 0.5397901827263524, + 0.5546177164520344, + 0.5444744477556533, + 0.5347041769061387, + 0.5392695909753441, + 0.5654202874604203 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..5cd858e7fa --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 1818.7690072059631, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35649528356036947, + "v_measure": 0.35649528356036947, + "v_measure_std": 0.015035142503373945, + "v_measures": [ + 0.3464105261114723, + 0.3340451700207264, + 0.34679346734682226, + 0.3398355162150171, + 0.3444361377320941, + 0.3799761693222242, + 0.36545618056350265, + 0.37163647597750904, + 0.3695424604002989, + 0.36682073191402786 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.v2.json 
b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..34e73275e4 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 80.80399250984192, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.40465001207381013, + "v_measure": 0.40465001207381013, + "v_measure_std": 0.0038850347956484723, + "v_measures": { + "Level 0": [ + 0.40379638807112206, + 0.4085550806574614, + 0.399688240991745, + 0.39888486933304207, + 0.40864951475413885, + 0.4053971411560196, + 0.3997468372715058, + 0.4085641141386234, + 0.40920801739874785, + 0.404009916965696 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..59412cef2d --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 79.21000981330872, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5230111060085674, + "v_measure": 0.5230111060085674, + "v_measure_std": 0.016015964835050155, + "v_measures": [ + 0.544379473183073, + 0.5229479535700808, + 0.5348929683697258, + 0.5304165308238298, + 
0.49325855181125505, + 0.5267648921156715, + 0.5282076914784095, + 0.5164145529238753, + 0.49573066561577994, + 0.5370977801939733 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.v2.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..4a05058a15 --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 42.75296902656555, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5110890076508168, + "v_measure": 0.5110890076508168, + "v_measure_std": 0.021040564503322787, + "v_measures": { + "Level 0": [ + 0.5305814828553521, + 0.49762656115511467, + 0.5047357572677348, + 0.5303274753178404, + 0.5422138170276668, + 0.5122902948386954, + 0.49116437739100466, + 0.5256060942383903, + 0.46783648726157, + 0.5085077291547982 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/model_meta.json b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/model_meta.json new file mode 100644 index 0000000000..1c86ecd25a --- /dev/null +++ b/results/mixedbread-ai__mxbai-embed-large-v1/990580e27d329c7408b3741ecff85876e128e203/model_meta.json @@ -0,0 +1 @@ +{"name": "mixedbread-ai/mxbai-embed-large-v1", "revision": "990580e27d329c7408b3741ecff85876e128e203", "release_date": "2024-03-07", "languages": ["eng_Latn"], "n_parameters": null, 
"memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": "MxbaiWrapper"} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..b116ae2271 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 452.0289957523346, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.29980397900118877, + "v_measure": 0.29980397900118877, + "v_measure_std": 0.004558208340759507, + "v_measures": [ + 0.2928962846562101, + 0.30226820102340113, + 0.30064914632632295, + 0.29234724131547635, + 0.30307339570413155, + 0.29705791421575334, + 0.30235451173285627, + 0.3052288656174225, + 0.29659686524442913, + 0.30556736417588465 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..b062a0a73f --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 16.100839138031006, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 
0.32427862133174284, + "v_measure": 0.32427862133174284, + "v_measure_std": 0.005562756779092928, + "v_measures": { + "Level 0": [ + 0.3256031481807181, + 0.3296448816618552, + 0.33131505104993664, + 0.3271590285261483, + 0.3154619031213426, + 0.3205109192478168, + 0.3217111581594313, + 0.32092388999203564, + 0.33262758114198293, + 0.31782865223616047 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..9a64efa8a4 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 60.62066864967346, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.20244564175375618, + "v_measure": 0.20244564175375618, + "v_measure_std": 0.00571727466742521, + "v_measures": [ + 0.1960854498176421, + 0.1996488729813874, + 0.2109762254548716, + 0.20602756589987153, + 0.2023032326441298, + 0.19126007246945118, + 0.20185740247502665, + 0.20238925249414688, + 0.2106186750889891, + 0.20328966821204525 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..37f991dc3d --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + 
"dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 5.374221563339233, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.22792290067475257, + "v_measure": 0.22792290067475257, + "v_measure_std": 0.007510838407945796, + "v_measures": { + "Level 0": [ + 0.23484834077255048, + 0.21530302009205388, + 0.23361195403115007, + 0.22733069965811717, + 0.2253734052131732, + 0.2382142578051887, + 0.23832532123344344, + 0.221290304053139, + 0.22237813796212497, + 0.2225535659265849 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..b969c64ec8 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 228.96853113174438, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.29843146622960776, + "v_measure": 0.29843146622960776, + "v_measure_std": 0.015648799779082463, + "v_measures": [ + 0.27705890110080456, + 0.2813315781015411, + 0.28667206771784914, + 0.2878476061447996, + 0.2913238527926979, + 0.309100224011698, + 0.3178183270218534, + 0.32799884730172413, + 0.30208846360914093, + 0.3030747944939689 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.v2.json 
b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..e189a4afde --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 12.906177282333374, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33465525266167695, + "v_measure": 0.33465525266167695, + "v_measure_std": 0.004282901779416489, + "v_measures": { + "Level 0": [ + 0.33927799882791837, + 0.33690860878830137, + 0.32723798543586596, + 0.3353715930532126, + 0.33839796119354354, + 0.3352978755883545, + 0.33779162598622875, + 0.3319464747610406, + 0.3375193893707444, + 0.32680301361155906 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..082adfb766 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 35.80358386039734, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.24888186887461528, + "v_measure": 0.24888186887461528, + "v_measure_std": 0.01227259478889196, + "v_measures": [ + 0.23719549932589995, + 0.23738660505888437, + 0.23357763761251463, + 0.23963445502959843, + 0.23964237230069138, + 0.270571050706782, + 0.2583649277466303, + 
0.25556780200559576, + 0.26316232230129716, + 0.2537160166582584 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..b6ee92dab9 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 5.340449810028076, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2936939173847978, + "v_measure": 0.2936939173847978, + "v_measure_std": 0.005870869964751773, + "v_measures": { + "Level 0": [ + 0.3008537505198166, + 0.29376610046701207, + 0.2971169750993412, + 0.29696858146558813, + 0.29749099643281396, + 0.2821031995923562, + 0.2944308819035401, + 0.299409644041809, + 0.28960723058696836, + 0.28519181373873187 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.json new file mode 100644 index 0000000000..8768d64f91 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 307.25623869895935, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.2852647661241243, + 
"v_measure": 0.2852647661241243, + "v_measure_std": 0.046541286384913276, + "v_measures": [ + 0.24363228421475558, + 0.34043169555380004, + 0.22964118413581855, + 0.24863399927464433, + 0.27502168003446575, + 0.27584882670660615, + 0.30566822453867776, + 0.26839075387728606, + 0.2873554099848955, + 0.27180147485292916, + 0.280207936114476, + 0.3650824981161492, + 0.3173318019904034, + 0.27932363582245245, + 0.39634347440814777, + 0.2544441003901316, + 0.2639829419211798, + 0.34128129770364235, + 0.26499348289385266, + 0.23138823351503354, + 0.2417541532796834, + 0.24566518584671995, + 0.3893088585719239, + 0.2698371525094972, + 0.2442488668459369 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.v2.json new file mode 100644 index 0000000000..79be663f36 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 27.289865016937256, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.24198601323536625, + "v_measure": 0.24198601323536625, + "v_measure_std": 0.013276420365121354, + "v_measures": { + "Level 0": [ + 0.2300593505885338, + 0.23508268360807033, + 0.23241548342834958, + 0.26915706772301773, + 0.25256127786287275, + 0.23688608522848298, + 0.22232488289061633, + 0.2380801297008098, + 0.2545237468566588, + 0.24876942446625025 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.json 
b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.json new file mode 100644 index 0000000000..d5c45c248e --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 1725.828932762146, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4922799685377598, + "v_measure": 0.4922799685377598, + "v_measure_std": 0.10960211117941973, + "v_measures": [ + 0.5303850140552447, + 0.5710657754857009, + 0.5315898474280252, + 0.34014024178861285, + 0.5405184006635801, + 0.5018686513661716, + 0.23146826899458403, + 0.576155181757918, + 0.5069058983713225, + 0.5927024054664375 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..c13939f7b8 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 78.87403702735901, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4941360861305967, + "v_measure": 0.4941360861305967, + "v_measure_std": 0.005065091553415061, + "v_measures": { + "Level 0": [ + 0.4972053831844197, + 0.4985317539170386, + 0.48588039473406214, + 0.49818045391020777, + 0.49491989166666556, + 0.49847502790322196, + 0.5001941562157675, + 0.49231581344434666, + 
0.4863656959301545, + 0.4892922904000829 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.json new file mode 100644 index 0000000000..f7e9a549aa --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 226.1578724384308, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35014774013118655, + "v_measure": 0.35014774013118655, + "v_measure_std": 0.04686752103894884, + "v_measures": [ + 0.3750147172345799, + 0.37201260290878313, + 0.28029848169659227, + 0.37793593822586846, + 0.3314146394658391, + 0.32550877729943695, + 0.33333744040405267, + 0.38459654974281204, + 0.32653372544618653, + 0.3260379060990616, + 0.4689698865814095, + 0.3663203144607196, + 0.4836923756818127, + 0.35600746626574953, + 0.32089047756239863, + 0.38539075383457355, + 0.31282434305392787, + 0.3464231593041693, + 0.2922090104586941, + 0.3158772397833245, + 0.345046212687298, + 0.3692562646506149, + 0.3051856466992528, + 0.3067089244979542, + 0.3462006492345518 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..84722d6262 --- /dev/null +++ 
b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 24.55757451057434, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3049649205554989, + "v_measure": 0.3049649205554989, + "v_measure_std": 0.005761116828829286, + "v_measures": { + "Level 0": [ + 0.3111924542773924, + 0.3088338102567898, + 0.303348727065143, + 0.31032766892158536, + 0.30247627118772, + 0.2950471222236022, + 0.3022421972467931, + 0.2959344941633458, + 0.3099670273083923, + 0.3102794329042253 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..beed95a9d8 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 379.2468492984772, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.28444477069227553, + "v_measure": 0.28444477069227553, + "v_measure_std": 0.016567365836052467, + "v_measures": [ + 0.27154964181591484, + 0.2714102835391841, + 0.2704795422614713, + 0.262524205454055, + 0.26704151585094443, + 0.3097585497580317, + 0.29481747753476684, + 0.3012979509692772, + 0.2932078510221693, + 0.30236068871694066 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git 
a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..46387b55a7 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 22.35237693786621, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.35434391394334347, + "v_measure": 0.35434391394334347, + "v_measure_std": 0.005613563004630377, + "v_measures": { + "Level 0": [ + 0.3604722599027116, + 0.35873711972786937, + 0.3577606921736584, + 0.35303146365845345, + 0.34904346291727806, + 0.3475668657399349, + 0.3601070895590226, + 0.36070508164563186, + 0.35091154417408815, + 0.3451035599347864 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..49b9c6e250 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 27.634557247161865, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.22530621700805079, + "v_measure": 0.22530621700805079, + "v_measure_std": 0.017624896606380162, + "v_measures": [ + 
0.2408495922817028, + 0.24321152879482444, + 0.22524508546896446, + 0.22903674022120507, + 0.235878482401794, + 0.25172436163444933, + 0.2085609054500412, + 0.21966025145630855, + 0.20540344953397088, + 0.19349177283724703 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.v2.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..e7023cb053 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 4.464260578155518, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.23406441864090793, + "v_measure": 0.23406441864090793, + "v_measure_std": 0.016923375201639494, + "v_measures": { + "Level 0": [ + 0.23005964605170978, + 0.24190884234084375, + 0.2523466456610527, + 0.2235366072851982, + 0.20131696880970046, + 0.22558011590535004, + 0.23875092833154557, + 0.24602512897812592, + 0.26232638681008014, + 0.2187929162354727 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/model_meta.json b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/model_meta.json new file mode 100644 index 0000000000..3b6812e464 --- /dev/null +++ b/results/sentence-transformers__LaBSE/e34fab64a3011d2176c99545a93d5cbddc9a91b7/model_meta.json @@ -0,0 +1 @@ +{"name": "sentence-transformers/LaBSE", "revision": "e34fab64a3011d2176c99545a93d5cbddc9a91b7", "release_date": "2019-11-01", 
"languages": ["ara_Arab", "bul_Cyrl", "cat_Latn", "ces_Latn", "dan_Latn", "deu_Latn", "ell_Grek", "eng_Latn", "spa_Latn", "est_Latn", "fas_Arab", "fin_Latn", "fra_Latn", "fra_Latn", "glg_Latn", "guj_Gujr", "heb_Hebr", "hin_Deva", "hrv_Latn", "hun_Latn", "hye_Armn", "ind_Latn", "ita_Latn", "jpn_Jpan", "kat_Geor", "kor_Hang", "kur_Arab", "lit_Latn", "lav_Latn", "mkd_Cyrl", "mon_Cyrl", "mar_Deva", "msa_Latn", "mya_Mymr", "nob_Latn", "nld_Latn", "pol_Latn", "por_Latn", "por_Latn", "ron_Latn", "rus_Cyrl", "slk_Latn", "slv_Latn", "sqi_Latn", "srp_Cyrl", "swe_Latn", "tha_Thai", "tur_Latn", "ukr_Cyrl", "urd_Arab", "vie_Latn", "zho_Hans", "zho_Hant"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": null} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..0af381666a --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 98.5497043132782, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.38367725707685313, + "v_measure": 0.38367725707685313, + "v_measure_std": 0.007571234916434395, + "v_measures": [ + 0.3861705063354808, + 0.3908363036054753, + 0.36683683351327706, + 0.3775626404470107, + 0.3861680968182999, + 0.3885964276452892, + 0.3794722162395541, + 0.39404353725901037, + 0.37911589265639545, + 0.38797011624873873 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git 
a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..618141f111 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 5.810603380203247, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4098882677943815, + "v_measure": 0.4098882677943815, + "v_measure_std": 0.009523964872488806, + "v_measures": { + "Level 0": [ + 0.40340827806278495, + 0.39573473629113115, + 0.40472315486134164, + 0.40466543954198453, + 0.41225738056040917, + 0.4320035763957874, + 0.41230791075241163, + 0.4183864046249508, + 0.40392814949459005, + 0.4114676473584234 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..908a00a45b --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 16.593175411224365, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3287710086348273, + "v_measure": 0.3287710086348273, + "v_measure_std": 0.00754288373295063, + "v_measures": [ 
+ 0.3343374637587593, + 0.3181285851530612, + 0.3201177688100758, + 0.32260555991021944, + 0.32095136778756267, + 0.32851713281865713, + 0.3349897363095164, + 0.34179497690287103, + 0.33458951069687476, + 0.33167798420067457 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..9a50851743 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 3.4249987602233887, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3460325961542299, + "v_measure": 0.3460325961542299, + "v_measure_std": 0.007091287185323974, + "v_measures": { + "Level 0": [ + 0.3415053195400624, + 0.3501730201986574, + 0.34476649934171943, + 0.3435084141967574, + 0.3512337731982489, + 0.33829414482907105, + 0.3580611653492557, + 0.35208407931158975, + 0.3324625064910066, + 0.34823703908593034 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..a39c5a321b --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": 
"e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 51.42057704925537, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3438933185926368, + "v_measure": 0.3438933185926368, + "v_measure_std": 0.015084000520185457, + "v_measures": [ + 0.3344861697809059, + 0.32330612725732444, + 0.33021387443753913, + 0.3256789461617313, + 0.33508463484520723, + 0.3508774540978055, + 0.3584833006559594, + 0.3634095257399166, + 0.352152136023761, + 0.36524101692621685 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..32a200a1de --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 5.184590816497803, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3749003434256308, + "v_measure": 0.3749003434256308, + "v_measure_std": 0.005011124593256334, + "v_measures": { + "Level 0": [ + 0.3804562589583136, + 0.37265465986935176, + 0.3738142840484856, + 0.3733953665484042, + 0.37293652434333635, + 0.36915067866870116, + 0.37012466487262546, + 0.38068700701148767, + 0.3707979779366562, + 0.3849860119989459 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.json 
b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..3545435434 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 11.041844606399536, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3186351621903202, + "v_measure": 0.3186351621903202, + "v_measure_std": 0.017336971951213677, + "v_measures": [ + 0.3077296511498838, + 0.29904952852458616, + 0.3060929599710469, + 0.2970532738518561, + 0.30029734479645276, + 0.3388872475509636, + 0.3296070693515537, + 0.3445063570391233, + 0.329366888655632, + 0.33376130101210333 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..0bbee02531 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 3.4713029861450195, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3573284184639764, + "v_measure": 0.3573284184639764, + "v_measure_std": 0.004761289124762311, + "v_measures": { + "Level 0": [ + 0.35801629627588133, + 0.36336914675415627, + 0.354206767936412, + 0.35149185609198985, + 0.36711239942457935, + 
0.3563095036960868, + 0.35517357641828384, + 0.35909690160279617, + 0.35090096359889156, + 0.357606772840687 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.json new file mode 100644 index 0000000000..1a2f5b11d0 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 95.8737952709198, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5070247309457051, + "v_measure": 0.5070247309457051, + "v_measure_std": 0.046023553759731356, + "v_measures": [ + 0.5458214255110118, + 0.5622544906476535, + 0.4538430874547047, + 0.49637605656515765, + 0.4976283037951732, + 0.4607871175950756, + 0.5442028029621981, + 0.4577985257952042, + 0.4732551816736723, + 0.4836487358836577, + 0.47198194679419647, + 0.5471434185457192, + 0.4983610711984165, + 0.5361379959098989, + 0.6004024304603816, + 0.4657103555436244, + 0.5194551231641161, + 0.5661006802509085, + 0.4860318985756045, + 0.47139153610589085, + 0.45756167836780137, + 0.47491629399151053, + 0.6226717778745392, + 0.5115157201003764, + 0.47062061887613343 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.v2.json new file mode 100644 index 0000000000..60c46e58eb --- /dev/null +++ 
b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 10.571322679519653, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4684306389535521, + "v_measure": 0.4684306389535521, + "v_measure_std": 0.012451615302298344, + "v_measures": { + "Level 0": [ + 0.4776516178184836, + 0.48726773884100827, + 0.4832894894517653, + 0.45704163603856507, + 0.4767720425479976, + 0.4709993981890916, + 0.45606604088092023, + 0.44683330913814795, + 0.46040828203979733, + 0.46797683458974443 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.json new file mode 100644 index 0000000000..2b25450c36 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 395.5768036842346, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5479845419577372, + "v_measure": 0.5479845419577372, + "v_measure_std": 0.11285422691786078, + "v_measures": [ + 0.5921809745660865, + 0.6024168793148268, + 0.593524744034557, + 0.3498261574451654, + 0.6104173689193234, + 0.5342672688863244, + 0.312455830539192, + 0.6506173884904118, + 0.590003066897206, + 0.6441357404842775 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git 
a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..9e89e0a51f --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 22.49931812286377, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5533863397932278, + "v_measure": 0.5533863397932278, + "v_measure_std": 0.0051046624452894054, + "v_measures": { + "Level 0": [ + 0.5556214499167038, + 0.5570348008414748, + 0.5502529486050846, + 0.5527225075660551, + 0.5595459451291612, + 0.5624113037721554, + 0.5504843579249107, + 0.5461144895078845, + 0.5534526045726675, + 0.5462229900961804 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.json new file mode 100644 index 0000000000..f761c61232 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 107.18429803848267, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5313685840246208, + "v_measure": 0.5313685840246208, + "v_measure_std": 0.05607312786136465, + "v_measures": [ 
+ 0.5699789837324569, + 0.5023978222167677, + 0.4331146927285657, + 0.5962629454189619, + 0.44917091475706905, + 0.48287570864149876, + 0.4981355660927683, + 0.6563400348094675, + 0.5258406383723092, + 0.5058631085759934, + 0.640469974032931, + 0.5547465151261819, + 0.6386327256451769, + 0.5775728041978352, + 0.520756144514187, + 0.5110527487973027, + 0.506464304344723, + 0.5135727024551129, + 0.5287482583443012, + 0.5202826020703899, + 0.5274259248669895, + 0.45710787777652157, + 0.4836275072870198, + 0.5322556191308159, + 0.5515184766801733 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..51b56f4723 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 11.085692405700684, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4527490279269508, + "v_measure": 0.4527490279269508, + "v_measure_std": 0.006210618436455052, + "v_measures": { + "Level 0": [ + 0.465665270830961, + 0.4517775008013562, + 0.4513574484844022, + 0.44858709951425446, + 0.44517383459701515, + 0.45219366677412964, + 0.45738579126907536, + 0.46014965894201226, + 0.44518125553615034, + 0.45001875252015106 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.json 
b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..19bb3092eb --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 95.12732815742493, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3425688415281717, + "v_measure": 0.3425688415281717, + "v_measure_std": 0.015371257942944163, + "v_measures": [ + 0.3328629626442746, + 0.33663564770540927, + 0.32893308104314106, + 0.31803619262828103, + 0.32550306205321433, + 0.3641024611302483, + 0.3491232718030816, + 0.35184987529254175, + 0.3589580998501727, + 0.3596837611313524 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..8caf223ae3 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 8.378719329833984, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.40313067289877563, + "v_measure": 0.40313067289877563, + "v_measure_std": 0.0036385032559879465, + "v_measures": { + "Level 0": [ + 0.4085967124308061, + 0.3977003490998413, + 0.4007687823403818, + 
0.4065817519942862, + 0.39777835121444316, + 0.4012319579897013, + 0.4058332122722177, + 0.40704179982975236, + 0.40341635724346203, + 0.40235745457286426 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..090b35f5ee --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 11.419964075088501, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.46490211003880566, + "v_measure": 0.46490211003880566, + "v_measure_std": 0.009833035575193027, + "v_measures": [ + 0.4581793083177559, + 0.475029910066843, + 0.4686199049113967, + 0.44284585890400796, + 0.4639602584753287, + 0.4612930792820161, + 0.4614906471845176, + 0.4638395847140715, + 0.47527857348367675, + 0.4784839750484431 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.v2.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..42b44e2837 --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 
3.0748984813690186, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4539168574138728, + "v_measure": 0.4539168574138728, + "v_measure_std": 0.012479565426155482, + "v_measures": { + "Level 0": [ + 0.44918264860947477, + 0.4568723737498788, + 0.45062777897735407, + 0.4706201064828361, + 0.45585733884153495, + 0.46629728179940527, + 0.4636032206354712, + 0.46099705080933767, + 0.4359326036031247, + 0.42917817063031044 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/model_meta.json b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/model_meta.json new file mode 100644 index 0000000000..0401016ddb --- /dev/null +++ b/results/sentence-transformers__all-MiniLM-L6-v2/8b3219a92973c328a8e22fadcfa821b5dc75636a/model_meta.json @@ -0,0 +1 @@ +{"name": "sentence-transformers/all-MiniLM-L6-v2", "revision": "8b3219a92973c328a8e22fadcfa821b5dc75636a", "release_date": "2021-08-30", "languages": ["eng-Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": null} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..ab7d7cdeaa --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 
86.20054388046265, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3379499800191673, + "v_measure": 0.3379499800191673, + "v_measure_std": 0.007363142291778588, + "v_measures": [ + 0.3388278348821894, + 0.3389938702496332, + 0.33380982401332177, + 0.3250569447414619, + 0.34429063730788506, + 0.3476260664365516, + 0.32648295875990074, + 0.34550264455622065, + 0.3355793362288068, + 0.3433296830157024 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..4fa9b1a154 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 6.319845914840698, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.36183432722474873, + "v_measure": 0.36183432722474873, + "v_measure_std": 0.00813462822681188, + "v_measures": { + "Level 0": [ + 0.36618974043711316, + 0.3498324250683925, + 0.35763508155830276, + 0.3712159483843975, + 0.35822636320352436, + 0.3670716434453229, + 0.3487922653036461, + 0.35757961943542244, + 0.37103609620411276, + 0.37076408920725257 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.json 
b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..9fe8996b69 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 28.146885871887207, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.29406331533783037, + "v_measure": 0.29406331533783037, + "v_measure_std": 0.00618892141729645, + "v_measures": [ + 0.2924433147949919, + 0.29932688843474764, + 0.2857066528699547, + 0.2983150175434375, + 0.28466164799912747, + 0.29807711383412405, + 0.29394690883713687, + 0.2861357994600734, + 0.30168662645225436, + 0.30033318315245594 + ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..d0fb240ac4 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 3.829831600189209, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.30828880315412366, + "v_measure": 0.30828880315412366, + "v_measure_std": 0.009854743673576279, + "v_measures": { + "Level 0": [ + 
0.29210939671579855, + 0.30630172655480137, + 0.32148561819732374, + 0.3095268025820234, + 0.3008072194167711, + 0.31987283862959837, + 0.31435028913976354, + 0.2927893776414545, + 0.3161014859247864, + 0.3095432767389159 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..664a93f095 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 46.297199010849, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3099500095937434, + "v_measure": 0.3099500095937434, + "v_measure_std": 0.013342849420790667, + "v_measures": [ + 0.30866169412362804, + 0.3055391265943512, + 0.29722194308689054, + 0.30441277761598334, + 0.2873984955866315, + 0.32883883785663315, + 0.30976921346307285, + 0.3333849237672754, + 0.32057418650204034, + 0.30369889734092786 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..4b3b6dea4c --- /dev/null +++ 
b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 5.908262729644775, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3453134135054978, + "v_measure": 0.3453134135054978, + "v_measure_std": 0.004720893145060998, + "v_measures": { + "Level 0": [ + 0.33683896477963954, + 0.3395433014779958, + 0.3498270221907992, + 0.34422359141202735, + 0.34771602038538424, + 0.3490118369699795, + 0.3394997619120008, + 0.3507565167070456, + 0.3482858538014652, + 0.3474312654186407 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..ce8e321123 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 16.637155294418335, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.30850717943176953, + "v_measure": 0.30850717943176953, + "v_measure_std": 0.016813669991818603, + "v_measures": [ + 0.2923604968058372, + 0.2937009923500305, + 0.28093207004718296, + 0.2998173101582566, + 0.29832420373487495, + 0.32212329283914426, + 0.3209447879947657, + 0.3347305455017347, + 0.3267305108412756, + 0.31540758404459274 + 
] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..37e8fe957a --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 3.5954113006591797, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3488432889914438, + "v_measure": 0.3488432889914438, + "v_measure_std": 0.011089483922831274, + "v_measures": { + "Level 0": [ + 0.3493257902407217, + 0.3385313899284641, + 0.357768844594858, + 0.3287494498270625, + 0.3553115321117743, + 0.35578291928575184, + 0.34823026321770695, + 0.33806859552722557, + 0.3695844040114814, + 0.34707970116939163 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.json new file mode 100644 index 0000000000..03aa00e2c2 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 136.3046612739563, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { 
+ "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4264062223916368, + "v_measure": 0.4264062223916368, + "v_measure_std": 0.04742563464605916, + "v_measures": [ + 0.37277761581154506, + 0.46409492328260454, + 0.3825830217942452, + 0.4188753999297151, + 0.3887993665535172, + 0.3919622314341335, + 0.468578152667782, + 0.40847137153578084, + 0.4175220777386184, + 0.4154785516440778, + 0.391485810594391, + 0.48378790117918613, + 0.46772742914847565, + 0.43365677706385497, + 0.5330771268772484, + 0.39676239704994926, + 0.4132305320441305, + 0.41764820598761504, + 0.4095582509830173, + 0.40708410235702874, + 0.3829832154411731, + 0.39776158641365755, + 0.5720250244093886, + 0.4376112135122882, + 0.386613274337495 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.v2.json new file mode 100644 index 0000000000..d985ed66d8 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 14.43251371383667, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4038357263804599, + "v_measure": 0.4038357263804599, + "v_measure_std": 0.009060216438926223, + "v_measures": { + "Level 0": [ + 0.4019648001047694, + 0.39977488074530876, + 0.406751067875052, + 0.41442827318681896, + 0.41470047418957634, + 0.39664323029477244, + 0.384859149213283, + 0.40420249119505136, + 0.4153608079376184, + 0.3996720890623485 + ] + } + } + ] + }, + 
"task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.json new file mode 100644 index 0000000000..338247dcc7 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 447.8844413757324, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5009859153407248, + "v_measure": 0.5009859153407248, + "v_measure_std": 0.10638463438559483, + "v_measures": [ + 0.5507082109425497, + 0.5306671331237389, + 0.584625826785394, + 0.32307738146641174, + 0.5349857044213202, + 0.47891247797540754, + 0.2763233848857601, + 0.5907250360912949, + 0.5424946674015012, + 0.5973393303138708 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..243216b0b7 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 24.755430459976196, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": 
"default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5139378553884388, + "v_measure": 0.5139378553884388, + "v_measure_std": 0.004294079096570996, + "v_measures": { + "Level 0": [ + 0.5093000978056622, + 0.5171641700366111, + 0.5121592955268334, + 0.5092066975958384, + 0.5208776216885552, + 0.518351867722501, + 0.5184321367998201, + 0.5115468690798618, + 0.5141735393321781, + 0.5081662582965276 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.json new file mode 100644 index 0000000000..722137a37e --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 107.82993912696838, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.49290455349280704, + "v_measure": 0.49290455349280704, + "v_measure_std": 0.04282922893084549, + "v_measures": [ + 0.511467632515496, + 0.48436843024496756, + 0.4460256425335859, + 0.5282684019626085, + 0.5014254912400526, + 0.4503556191599693, + 0.4790446299972, + 0.5690335673943024, + 0.47265317976614685, + 0.47742436086149176, + 0.5980683460660893, + 0.5135362965566143, + 0.5742897900021677, + 0.544466175621605, + 0.44390707965064874, + 0.4820011033553236, + 0.46792590424045855, + 0.4534974347588226, + 0.45444640000971614, + 0.4413160601623461, + 0.47538818140659894, + 0.5340349653884281, + 0.47049165397721143, + 0.4559281762911649, + 0.49324931415716167 + ] + } + ] + }, + "task_name": 
"StackExchangeClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..8dfe2caccb --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 12.86415719985962, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.43605152531927394, + "v_measure": 0.43605152531927394, + "v_measure_std": 0.0034567741270241556, + "v_measures": { + "Level 0": [ + 0.4325256875004311, + 0.4382965964393776, + 0.43867021687786417, + 0.4353863910472667, + 0.42835165502745426, + 0.4392433331698399, + 0.43964178343537147, + 0.4332915258912072, + 0.43722026116947166, + 0.43788780263445476 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..98f587417b --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 87.4092788696289, + "kg_co2_emissions": null, + "mteb_version": 
"1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3166697199604255, + "v_measure": 0.3166697199604255, + "v_measure_std": 0.01646975173548221, + "v_measures": [ + 0.30410093933864535, + 0.3008697942230494, + 0.30091840189156654, + 0.29478647932436813, + 0.3044685529670446, + 0.3417391429135353, + 0.3227350191608718, + 0.3299541190021794, + 0.3364436867680772, + 0.3306810640149168 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.v2.json new file mode 100644 index 0000000000..caf5b6a068 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 8.49235725402832, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3733997178456824, + "v_measure": 0.3733997178456824, + "v_measure_std": 0.0031100199236162697, + "v_measures": { + "Level 0": [ + 0.3752076892169227, + 0.3688273549645349, + 0.38113149848953726, + 0.37242178655524144, + 0.3735764155715625, + 0.37365938509510194, + 0.3703088243075582, + 0.3730340455899842, + 0.37379670067150017, + 0.37203347799488123 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.json 
b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..d48445a331 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 16.55503821372986, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.399864574585611, + "v_measure": 0.399864574585611, + "v_measure_std": 0.013511430601287315, + "v_measures": [ + 0.405939530348118, + 0.4292822416353654, + 0.40218222250491364, + 0.4034398532125731, + 0.3927436029503992, + 0.3869584837044961, + 0.38231231967364127, + 0.4127524485379225, + 0.3854212815878023, + 0.3976137617008783 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.v2.json b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..15d1f9fb84 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-MiniLM-L12-v2/bf3bf13ab40c3157080a7ab344c831b9ad18b5eb/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 3.5297610759735107, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.40595161159909676, + "v_measure": 0.40595161159909676, + "v_measure_std": 0.014355564650500679, + "v_measures": { + 
"Level 0": [ + 0.4038565389407894, + 0.38989009449074696, + 0.43100632352104257, + 0.3941872036645948, + 0.40939849029092684, + 0.4016242968879055, + 0.3982765137367584, + 0.4173486171483195, + 0.386828659266098, + 0.42709937804378467 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.json new file mode 100644 index 0000000000..000337c99a --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "65b79d1d13f80053f67aca9498d9402c2d9f1f40", + "evaluation_time": 219.2024097442627, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33023811989847823, + "v_measure": 0.33023811989847823, + "v_measure_std": 0.007094599533026518, + "v_measures": [ + 0.33359093686046637, + 0.3327563886031374, + 0.32479840840035507, + 0.3297908693999038, + 0.3171073045793568, + 0.32847420407954947, + 0.32587173429564786, + 0.32742964010202824, + 0.3434709732754766, + 0.3390907393888608 + ] + } + ] + }, + "task_name": "BiorxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.v2.json new file mode 100644 index 0000000000..5a53a5f395 --- /dev/null +++ 
b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "f5dbc242e11dd8e24def4c4268607a49e02946dc", + "evaluation_time": 10.111212253570557, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.36069759040358595, + "v_measure": 0.36069759040358595, + "v_measure_std": 0.005056155075773897, + "v_measures": { + "Level 0": [ + 0.35652164979747, + 0.3618063933770063, + 0.35478084029378737, + 0.35483116643164014, + 0.3577412453894285, + 0.36628680498009286, + 0.36719725324011115, + 0.3617755233720205, + 0.3690757854628561, + 0.356959241691447 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.json new file mode 100644 index 0000000000..b58d0c17df --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "258694dd0231531bc1fd9de6ceb52a0853c6d908", + "evaluation_time": 66.73296117782593, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.29447267091454243, + "v_measure": 0.29447267091454243, + "v_measure_std": 0.0050675155607236115, + "v_measures": [ + 0.2950460644617829, + 0.2912854206874072, + 0.2935105955876649, + 0.2936126599484787, + 0.28242862358760507, + 0.2935308891916816, + 0.29487308014145475, + 0.29915465626420457, + 0.3001488383379328, + 0.30113588093721205 
+ ] + } + ] + }, + "task_name": "BiorxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.v2.json new file mode 100644 index 0000000000..aa7ed27dc9 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/BiorxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "eb4edb10386758d274cd161093eb351381a16dbf", + "evaluation_time": 5.325770378112793, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.318947346754725, + "v_measure": 0.318947346754725, + "v_measure_std": 0.007344838288185248, + "v_measures": { + "Level 0": [ + 0.32036852370807684, + 0.3148226264339179, + 0.32102015494041364, + 0.3215229686158149, + 0.31243413907158213, + 0.3334426571368441, + 0.3170419168075022, + 0.30567758694580927, + 0.3159377012215899, + 0.327205192665699 + ] + } + } + ] + }, + "task_name": "BiorxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.json new file mode 100644 index 0000000000..d006178346 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 113.67033863067627, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + 
"scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3193313867681617, + "v_measure": 0.3193313867681617, + "v_measure_std": 0.010271057166186467, + "v_measures": [ + 0.3126262209680086, + 0.31383140174386503, + 0.31004275777092744, + 0.30956027753072296, + 0.3051378821471224, + 0.3297844472312541, + 0.3264989128446295, + 0.33897492049202715, + 0.32056086651017957, + 0.32629618044288056 + ] + } + ] + }, + "task_name": "MedrxivClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.v2.json new file mode 100644 index 0000000000..6f0867c8d2 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "e7a26af6f3ae46b30dde8737f02c07b1505bcc73", + "evaluation_time": 8.222451210021973, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3540119990090064, + "v_measure": 0.3540119990090064, + "v_measure_std": 0.005243137984141148, + "v_measures": { + "Level 0": [ + 0.35566416251212457, + 0.3481397912157614, + 0.35466991115408975, + 0.35547417862171443, + 0.3592320606183781, + 0.3613176209666668, + 0.3417092787031761, + 0.35390172174011864, + 0.35576616348972884, + 0.35424510106830503 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.json 
b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.json new file mode 100644 index 0000000000..b38e087262 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 38.51788020133972, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.31529638851604835, + "v_measure": 0.31529638851604835, + "v_measure_std": 0.014122246480347217, + "v_measures": [ + 0.30718128420539176, + 0.2964725441766383, + 0.3011809974282635, + 0.30530071539616677, + 0.3001552695945038, + 0.3303678818313436, + 0.3233434219235773, + 0.33795771082881865, + 0.3295035780853505, + 0.3215004816904291 + ] + } + ] + }, + "task_name": "MedrxivClusteringS2S" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.v2.json new file mode 100644 index 0000000000..a3a807020a --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/MedrxivClusteringS2S.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "35191c8c0dca72d8ff3efcd72aa802307d469663", + "evaluation_time": 5.377524137496948, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3605999997935113, + "v_measure": 0.3605999997935113, + "v_measure_std": 0.006762721172457443, + "v_measures": { + "Level 0": [ + 
0.3556134385808981, + 0.35442224922464144, + 0.36261061630089436, + 0.35826199357312066, + 0.3696521138354752, + 0.3611399624351116, + 0.35955994343780806, + 0.36848627631962366, + 0.34747158775160175, + 0.368781816475938 + ] + } + } + ] + }, + "task_name": "MedrxivClusteringS2S.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.json new file mode 100644 index 0000000000..7055734028 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 309.89859986305237, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4565389661201268, + "v_measure": 0.4565389661201268, + "v_measure_std": 0.05398738737610236, + "v_measures": [ + 0.38955770898405906, + 0.5277279697001578, + 0.4204803469787914, + 0.4624887888755375, + 0.418182946834442, + 0.4287358548867993, + 0.49583734162714965, + 0.43696139510262616, + 0.4432072686687305, + 0.43681887936283664, + 0.40958152587687535, + 0.4926073503735078, + 0.47933552892726816, + 0.47468698664107944, + 0.5891354249662953, + 0.4071526630723635, + 0.4400580103397398, + 0.4639574414293356, + 0.42381277803216144, + 0.4153863162757713, + 0.41509141971004654, + 0.4223920515695139, + 0.6132150065198433, + 0.4875986651857025, + 0.4194644830625347 + ] + } + ] + }, + "task_name": "RedditClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.v2.json 
b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.v2.json new file mode 100644 index 0000000000..ad36f63c7c --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "24640382cdbf8abc73003fb0fa6d111a705499eb", + "evaluation_time": 27.040958404541016, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.43672190868268235, + "v_measure": 0.43672190868268235, + "v_measure_std": 0.008813694747555757, + "v_measures": { + "Level 0": [ + 0.42548985343937507, + 0.4461313428846983, + 0.4279939966854714, + 0.4388807297608616, + 0.4342402286372965, + 0.423388044299789, + 0.4517655567073429, + 0.4447791083347925, + 0.4389313316669487, + 0.4356188944102478 + ] + } + } + ] + }, + "task_name": "RedditClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.json new file mode 100644 index 0000000000..e8dc61021d --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 1151.222552061081, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.520548596880906, + "v_measure": 0.520548596880906, + "v_measure_std": 0.11787625789389958, + "v_measures": [ + 0.581608524382365, + 
0.553781458634249, + 0.5968132432989782, + 0.3230022466339231, + 0.5661425272329945, + 0.4997944468005974, + 0.26920495834546027, + 0.6121341175048557, + 0.5691257307110584, + 0.6338787152645794 + ] + } + ] + }, + "task_name": "RedditClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.v2.json new file mode 100644 index 0000000000..a3ebb0069d --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/RedditClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "385e3cb46b4cfa89021f56c4380204149d0efe33", + "evaluation_time": 55.49957323074341, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5318186414953125, + "v_measure": 0.5318186414953125, + "v_measure_std": 0.004010534633418256, + "v_measures": { + "Level 0": [ + 0.5371808619804662, + 0.5301052756885235, + 0.5280406225159753, + 0.5255446195033356, + 0.5308585802705889, + 0.5366996277590168, + 0.536177069277631, + 0.5277981076443224, + 0.5354708043160082, + 0.5303108459972582 + ] + } + } + ] + }, + "task_name": "RedditClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.json new file mode 100644 index 0000000000..01490b34e5 --- /dev/null +++ 
b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.json @@ -0,0 +1,47 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 227.97792148590088, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.5299265157315173, + "v_measure": 0.5299265157315173, + "v_measure_std": 0.05105060083651259, + "v_measures": [ + 0.5616808543334835, + 0.4986733235161252, + 0.4701290832478378, + 0.5583960588562497, + 0.5031043773645992, + 0.516332368977028, + 0.5250577193375806, + 0.5955776723611023, + 0.524794168457929, + 0.5226991395545374, + 0.6698954864587106, + 0.5714120728578519, + 0.6449901173957622, + 0.5950372156342982, + 0.48260605974162735, + 0.5244832051678019, + 0.49706347442549453, + 0.484118923687127, + 0.49550318704230883, + 0.46341449045345395, + 0.5170193868424628, + 0.5360732496414673, + 0.49150457538528936, + 0.4937311253300482, + 0.5048655572177555 + ] + } + ] + }, + "task_name": "StackExchangeClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.v2.json new file mode 100644 index 0000000000..bea8e437a2 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6cbc1f7b2bc0622f2e39d2c77fa502909748c259", + "evaluation_time": 24.709307193756104, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 
0.4617920391928713, + "v_measure": 0.4617920391928713, + "v_measure_std": 0.007688246944550186, + "v_measures": { + "Level 0": [ + 0.46638849634875296, + 0.46917703606386596, + 0.45714231573316694, + 0.46975199035603815, + 0.46727678623702196, + 0.4500046462616008, + 0.4679236487597783, + 0.44688003581624575, + 0.4608410381088478, + 0.4625343982433941 + ] + } + } + ] + }, + "task_name": "StackExchangeClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.json new file mode 100644 index 0000000000..8d3f24dc27 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 220.0045247077942, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.33060988268868846, + "v_measure": 0.33060988268868846, + "v_measure_std": 0.016559777342708134, + "v_measures": [ + 0.3182190286433459, + 0.3186483086992987, + 0.31183873214749, + 0.3118023062892616, + 0.31448980879769917, + 0.3582172714922931, + 0.33600667238806275, + 0.3456979612796965, + 0.3480387122831772, + 0.34314002486656 + ] + } + ] + }, + "task_name": "StackExchangeClusteringP2P" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.v2.json new file mode 
100644 index 0000000000..f6eb821b0e --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/StackExchangeClusteringP2P.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "815ca46b2622cec33ccafc3735d572c266efdb44", + "evaluation_time": 15.91111159324646, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.3825217679176006, + "v_measure": 0.3825217679176006, + "v_measure_std": 0.00441752805694364, + "v_measures": { + "Level 0": [ + 0.3844307381686811, + 0.37501157429269105, + 0.38308979171878016, + 0.38332106419890516, + 0.38619557975694074, + 0.38186882120782395, + 0.3888369788394953, + 0.3876616308149724, + 0.37654521504614685, + 0.37825628513157006 + ] + } + } + ] + }, + "task_name": "StackExchangeClusteringP2P.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.json new file mode 100644 index 0000000000..8ad8147230 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.json @@ -0,0 +1,32 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 27.53256845474243, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4435684966472212, + "v_measure": 0.4435684966472212, + "v_measure_std": 0.015928670962944386, + "v_measures": [ + 0.46915521155441353, + 0.43808933081429624, + 0.426107191203892, + 0.42737834118397516, + 0.4204915208659386, + 0.4675599595162288, + 
0.4528760763044844, + 0.44928188291593635, + 0.43711747303532367, + 0.44762797907772345 + ] + } + ] + }, + "task_name": "TwentyNewsgroupsClustering" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.v2.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.v2.json new file mode 100644 index 0000000000..80e8929c82 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/TwentyNewsgroupsClustering.v2.json @@ -0,0 +1,34 @@ +{ + "dataset_revision": "6125ec4e24fa026cec8a478383ee943acfbd5449", + "evaluation_time": 4.321641206741333, + "kg_co2_emissions": null, + "mteb_version": "1.12.22", + "scores": { + "test": [ + { + "hf_subset": "default", + "languages": [ + "eng-Latn" + ], + "main_score": 0.4508690125625724, + "v_measure": 0.4508690125625724, + "v_measure_std": 0.014157869672938217, + "v_measures": { + "Level 0": [ + 0.46909076668733535, + 0.4487961579118287, + 0.44162019335031905, + 0.45685166023982643, + 0.41816441821958866, + 0.4601511040711086, + 0.4616186361062128, + 0.43880195958782814, + 0.4622555640643589, + 0.45133966538731657 + ] + } + } + ] + }, + "task_name": "TwentyNewsgroupsClustering.v2" +} \ No newline at end of file diff --git a/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/model_meta.json b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/model_meta.json new file mode 100644 index 0000000000..b7801dde31 --- /dev/null +++ b/results/sentence-transformers__paraphrase-multilingual-mpnet-base-v2/79f2382ceacceacdf38563d7c5d16b9ff8d725d6/model_meta.json @@ -0,0 +1 @@ +{"name": "sentence-transformers/paraphrase-multilingual-mpnet-base-v2", 
"revision": "79f2382ceacceacdf38563d7c5d16b9ff8d725d6", "release_date": "2019-11-01", "languages": ["ara_Arab", "bul_Cyrl", "cat_Latn", "ces_Latn", "dan_Latn", "deu_Latn", "ell_Grek", "eng_Latn", "spa_Latn", "est_Latn", "fas_Arab", "fin_Latn", "fra_Latn", "fra_Latn", "glg_Latn", "guj_Gujr", "heb_Hebr", "hin_Deva", "hrv_Latn", "hun_Latn", "hye_Armn", "ind_Latn", "ita_Latn", "jpn_Jpan", "kat_Geor", "kor_Hang", "kur_Arab", "lit_Latn", "lav_Latn", "mkd_Cyrl", "mon_Cyrl", "mar_Deva", "msa_Latn", "mya_Mymr", "nob_Latn", "nld_Latn", "pol_Latn", "por_Latn", "por_Latn", "ron_Latn", "rus_Cyrl", "slk_Latn", "slv_Latn", "sqi_Latn", "srp_Cyrl", "swe_Latn", "tha_Thai", "tur_Latn", "ukr_Cyrl", "urd_Arab", "vie_Latn", "zho_Hans", "zho_Hant"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "framework": [], "loader": null} \ No newline at end of file diff --git a/scripts/run_mteb_english_cluster.py b/scripts/run_mteb_english_cluster.py new file mode 100644 index 0000000000..d316972a35 --- /dev/null +++ b/scripts/run_mteb_english_cluster.py @@ -0,0 +1,71 @@ +"""Example script for benchmarking all datasets constituting the MTEB English leaderboard & average scores""" + +from __future__ import annotations + +import logging + +from mteb import MTEB, get_model, get_tasks +from mteb.models.bge_models import bge_base_en_v1_5 +from mteb.models.e5_models import ( + e5_eng_base_v2, + e5_eng_large_v2, + e5_eng_small, + e5_eng_small_v2, + e5_mult_base, + e5_mult_large, + e5_mult_small, +) +from mteb.models.mxbai_models import mxbai_embed_large_v1 +from mteb.models.sentence_transformers_models import ( + all_MiniLM_L6_v2, + labse, + paraphrase_multilingual_MiniLM_L12_v2, + paraphrase_multilingual_mpnet_base_v2, +) + +logging.basicConfig(level=logging.INFO) + +logger = logging.getLogger("main") + +TASK_LIST_CLUSTERING = [ + # "ArxivClusteringP2P", # hierarchical + # "ArxivClusteringS2S", # hierarchical + 
"BiorxivClusteringP2P", + "BiorxivClusteringS2S", + "MedrxivClusteringP2P", + "MedrxivClusteringS2S", + "RedditClustering", + "RedditClusteringP2P", + "StackExchangeClustering", + "StackExchangeClusteringP2P", + "TwentyNewsgroupsClustering", +] + +TASK_LIST = [x + ".v2" for x in TASK_LIST_CLUSTERING] + TASK_LIST_CLUSTERING + +MODELS = [ + paraphrase_multilingual_MiniLM_L12_v2, + all_MiniLM_L6_v2, + e5_eng_small, + e5_eng_small_v2, + e5_mult_small, + e5_mult_base, + e5_mult_large, + paraphrase_multilingual_mpnet_base_v2, + e5_eng_large_v2, + e5_eng_base_v2, + labse, + mxbai_embed_large_v1, + bge_base_en_v1_5, +] + +for model in MODELS: + model_name = model.name + revision = model.revision + + model = get_model(model_name=model_name, revision=revision, trust_remote_code=True) + + eval_splits = ["test"] + tasks = get_tasks(tasks=TASK_LIST, languages=["eng"]) + evaluation = MTEB(tasks=tasks) + evaluation.run(model, output_folder="results", eval_splits=eval_splits) diff --git a/tests/test_RerankingEvaluator.py b/tests/test_RerankingEvaluator.py index 614aa17a97..39e36e57f2 100644 --- a/tests/test_RerankingEvaluator.py +++ b/tests/test_RerankingEvaluator.py @@ -53,6 +53,6 @@ def test_nAUC(self): conf_scores = [self.evaluator.conf_scores(x) for x in pred_scores] nauc_scores_map = self.evaluator.nAUC_scores(conf_scores, ap_scores, "map") - assert nauc_scores_map["nAUC_map_max"] == pytest.approx(0.86943, TOL) + assert nauc_scores_map["nAUC_map_max"] == pytest.approx(0.8694, TOL) assert nauc_scores_map["nAUC_map_std"] == pytest.approx(0.94065, TOL) assert nauc_scores_map["nAUC_map_diff1"] == pytest.approx(0.85460, TOL) diff --git a/tests/test_reproducible_workflow.py b/tests/test_reproducible_workflow.py index ddc3dace57..7c0cd84ab2 100644 --- a/tests/test_reproducible_workflow.py +++ b/tests/test_reproducible_workflow.py @@ -14,15 +14,16 @@ @pytest.mark.parametrize("task_name", ["BornholmBitextMining"]) @pytest.mark.parametrize("model_name", 
["sentence-transformers/all-MiniLM-L6-v2"]) -def test_reproducibility_workflow(task_name: str, model_name: str): +@pytest.mark.parametrize("model_revision", ["8b3219a92973c328a8e22fadcfa821b5dc75636a"]) +def test_reproducibility_workflow(task_name: str, model_name: str, model_revision: str): """Test that a model and a task can be fetched and run in a reproducible fashion.""" - model_meta = mteb.get_model_meta(model_name) + model_meta = mteb.get_model_meta(model_name, revision=model_revision) task = mteb.get_task(task_name) assert isinstance(model_meta, ModelMeta) assert isinstance(task, mteb.AbsTask) - model = mteb.get_model(model_name) + model = mteb.get_model(model_name, revision=model_revision) assert isinstance(model, (Encoder, EncoderWithQueryCorpusEncode)) eval = MTEB(tasks=[task])