Skip to content

Commit

Permalink
docs: Update annotations for tasks (#936)
Browse files Browse the repository at this point in the history
* annotations

* annotate

* annotate

* annotate

* annotate

* ann

* ann

* ann

* ann

* ann

* formatted

* add data

* add data

* Update docs/mmteb/points/936.jsonl

* lint

---------

Co-authored-by: Kenneth Enevoldsen <kennethcenevoldsen@gmail.com>
  • Loading branch information
henilp105 and KennethEnevoldsen authored Jun 16, 2024
1 parent 3fbce3d commit 8823369
Show file tree
Hide file tree
Showing 14 changed files with 93 additions and 90 deletions.
3 changes: 2 additions & 1 deletion docs/mmteb/points.md
Original file line number Diff line number Diff line change
Expand Up @@ -92,4 +92,5 @@ Please also add your first name and last name as you want them to appear in
| ManuelFay | Manuel | Faysse | manuel.faysse@centralesupelec.fr | ~Manuel_Faysse1 | CentraleSupélec & Illuin Technology |
| hgissbkh | Hippolyte | Gisserot-Boukhlef | hippolyte.gisserot-boukhlef@centralesupelec.fr | ~Hippolyte_Gisserot-Boukhlef1 | CentraleSupélec & Artefact Research Center |
| sted97 | Simone | Tedeschi | tedeschi@diag.uniroma1.it | ~Simone_Tedeschi1 | Sapienza University of Rome |
| gentaiscool | Genta Indra | Winata | genta.winata@capitalone.com | ~Genta_Indra_Winata1 | Capital One |
| gentaiscool | Genta Indra | Winata | genta.winata@capitalone.com | ~Genta_Indra_Winata1 | Capital One |
| henilp105 | Henil | Panchal | henilp105@gmail.com | ~Henil_Shalin_Panchal1 | Nirma University |
2 changes: 2 additions & 0 deletions docs/mmteb/points/936.jsonl
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
{"GitHub": "henilp105", "Dataset annotations": 9}
{"GitHub": "KennethEnevoldsen", "Review PR": 2}
2 changes: 1 addition & 1 deletion mteb/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -271,7 +271,7 @@ def create_meta(args: argparse.Namespace) -> None:
"dataset": {
"type": task.metadata.dataset["path"],
"name": f"MTEB {task.metadata.name} ({hf_subset_score['hf_subset']})",
"config": hf_subset_score["hf_subset"],
"config": hf_subset_score["hf_subset"],
"split": split,
"revision": task_result.dataset_revision,
},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -26,15 +26,15 @@ class AmazonReviewsClassification(MultilingualTask, AbsTaskClassification):
"zh": ["cmn-Hans"],
},
main_score="accuracy",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2015-11-01", "2019-11-01"),
form=["written"],
domains=["Reviews"],
task_subtypes=[],
license="https://docs.opendata.aws/amazon-reviews-ml/license.txt",
socioeconomic_status="medium",
annotations_creators="human-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@misc{keung2020multilingual,
title={The Multilingual Amazon Reviews Corpus},
author={Phillip Keung and Yichao Lu and György Szarvas and Noah A. Smith},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -38,15 +38,15 @@ class MasakhaNEWSClassification(AbsTaskClassification, MultilingualTask):
eval_splits=["test"],
eval_langs=_LANGUAGES,
main_score="accuracy",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2023-01-01", "2023-04-19"), # rough estimate
form=["written"],
domains=["News"],
task_subtypes=[],
license="cc-by-nc-4.0",
socioeconomic_status="high",
annotations_creators="expert-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@misc{adelani2023masakhanews,
title={MasakhaNEWS: News Topic Classification for African languages},
author={David Ifeoluwa Adelani and Marek Masiak and Israel Abebe Azime and Jesujoba Alabi and Atnafu Lambebo Tonja and Christine Mwase and Odunayo Ogundepo and Bonaventure F. P. Dossou and Akintunde Oladipo and Doreen Nixdorf and Chris Chinenye Emezue and sana al-azzawi and Blessing Sibanda and Davis David and Lolwethu Ndolela and Jonathan Mukiibi and Tunde Ajayi and Tatiana Moteu and Brian Odhiambo and Abraham Owodunni and Nnaemeka Obiefuna and Muhidin Mohamed and Shamsuddeen Hassan Muhammad and Teshome Mulugeta Ababu and Saheed Abdullahi Salahudeen and Mesay Gemeda Yigezu and Tajuddeen Gwadabe and Idris Abdulmumin and Mahlet Taye and Oluwabusayo Awoyomi and Iyanuoluwa Shode and Tolulope Adelani and Habiba Abdulganiyu and Abdul-Hakeem Omotayo and Adetola Adeeko and Abeeb Afolabi and Anuoluwapo Aremu and Olanrewaju Samuel and Clemencia Siro and Wangari Kimotho and Onyekachi Ogbu and Chinedu Mbonu and Chiamaka Chukwuneke and Samuel Fanijo and Jessica Ojo and Oyinkansola Awosan and Tadesse Kebede and Toadoum Sari Sakayo and Pamela Nyatsine and Freedmore Sidume and Oreen Yousuf and Mardiyyah Oduwole and Tshinu Tshinu and Ussen Kimanuka and Thina Diko and Siyanda Nxakama and Sinodos Nigusse and Abdulmejid Johar and Shafie Mohamed and Fuad Mire Hassan and Moges Ahmed Mehamed and Evrard Ngabire and Jules Jules and Ivan Ssenkungu and Pontus Stenetorp},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,7 @@ class MassiveIntentClassification(MultilingualTask, AbsTaskClassification):
"revision": "4672e20407010da34463acc759c162ca9734bca6",
},
description="MASSIVE: A 1M-Example Multilingual Natural Language Understanding Dataset with 51 Typologically-Diverse Languages",
reference="https://arxiv.org/abs/2204.08582#:~:text=MASSIVE%20contains%201M%20realistic%2C%20parallel,diverse%20languages%20from%2029%20genera.",
reference="https://arxiv.org/abs/2204.08582",
category="s2s",
type="Classification",
eval_splits=["validation", "test"],
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,7 @@ class MassiveScenarioClassification(MultilingualTask, AbsTaskClassification):
"revision": "fad2c6e8459f9e1c45d9315f4953d921437d70f8",
},
description="MASSIVE: A 1M-Example Multilingual Natural Language Understanding Dataset with 51 Typologically-Diverse Languages",
reference="https://arxiv.org/abs/2204.08582#:~:text=MASSIVE%20contains%201M%20realistic%2C%20parallel,diverse%20languages%20from%2029%20genera.",
reference="https://arxiv.org/abs/2204.08582",
category="s2s",
type="Classification",
eval_splits=["validation", "test"],
Expand Down
14 changes: 7 additions & 7 deletions mteb/tasks/Clustering/deu/TenKGnadClusteringP2P.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,14 +22,14 @@ class TenKGnadClusteringP2P(AbsTaskClustering):
eval_langs=["deu-Latn"],
main_score="v_measure",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
form=["written"],
domains=["Web"],
task_subtypes=[],
license="cc-by-nc-sa-4.0",
socioeconomic_status="mixed",
annotations_creators=None,
dialect=None,
text_creation=None,
dialect=[],
text_creation="found",
bibtex_citation=None,
n_samples={"test": 45914},
avg_character_length={"test": 2641.03},
Expand Down
18 changes: 9 additions & 9 deletions mteb/tasks/Reranking/eng/MindSmallReranking.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,15 +20,15 @@ class MindSmallReranking(AbsTaskReranking):
eval_splits=["test"],
eval_langs=["eng-Latn"],
main_score="map",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2019-10-12", "2019-11-22"),
form=["written"],
domains=["News"],
task_subtypes=[],
license="https://github.com/msnews/MIND/blob/master/MSR%20License_Data.pdf",
socioeconomic_status="mixed",
annotations_creators="expert-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@inproceedings{wu-etal-2020-mind, title = "{MIND}: A Large-scale Dataset for News
Recommendation", author = "Wu, Fangzhao and Qiao, Ying and Chen, Jiun-Hung and Wu, Chuhan and Qi,
Tao and Lian, Jianxun and Liu, Danyang and Xie, Xing and Gao, Jianfeng and Wu, Winnie and Zhou, Ming",
Expand Down
22 changes: 11 additions & 11 deletions mteb/tasks/Reranking/zho/CMTEBReranking.py
Original file line number Diff line number Diff line change
Expand Up @@ -90,15 +90,15 @@ class CMedQAv1(AbsTaskReranking):
eval_splits=["test"],
eval_langs=["cmn-Hans"],
main_score="map",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2017-01-01", "2017-07-26"),
form=["written"],
domains=["Medical"],
task_subtypes=[],
license="not specified.",
socioeconomic_status="mixed",
annotations_creators="expert-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@article{zhang2017chinese,
title={Chinese Medical Question Answer Matching Using End-to-End Character-Level Multi-Scale CNNs},
author={Zhang, Sheng and Zhang, Xin and Wang, Hui and Cheng, Jiajun and Li, Pei and Ding, Zhaoyun},
Expand All @@ -109,8 +109,8 @@ class CMedQAv1(AbsTaskReranking):
year={2017},
publisher={Multidisciplinary Digital Publishing Institute}
}""",
n_samples=None,
avg_character_length=None,
n_samples={"test": 2000},
avg_character_length={"test": 165},
)


Expand Down
22 changes: 11 additions & 11 deletions mteb/tasks/Retrieval/eng/HagridRetrieval.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,23 +28,23 @@ class HagridRetrieval(AbsTaskRetrieval):
eval_splits=["dev"],
eval_langs=["eng-Latn"],
main_score="ndcg_at_10",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2019-02-01", "2022-10-18"),
form=["written"],
domains=["Encyclopaedic"],
task_subtypes=[],
license="apache-2.0",
socioeconomic_status="mixed",
annotations_creators="expert-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@article{hagrid,
title={{HAGRID}: A Human-LLM Collaborative Dataset for Generative Information-Seeking with Attribution},
author={Ehsan Kamalloo and Aref Jafari and Xinyu Zhang and Nandan Thakur and Jimmy Lin},
year={2023},
journal={arXiv:2307.16883},
}""",
n_samples=None,
avg_character_length=None,
n_samples={"train": 1922},
avg_character_length={"train": 14.53},
)

def load_data(self, **kwargs):
Expand Down
22 changes: 11 additions & 11 deletions mteb/tasks/Retrieval/fra/AlloprofRetrieval.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,15 +21,15 @@ class AlloprofRetrieval(AbsTaskRetrieval):
eval_splits=["test"],
eval_langs=["fra-Latn"],
main_score="ndcg_at_10",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=None, # no date specified.
form=["written"],
domains=["Encyclopaedic"],
task_subtypes=[],
license="cc-by-nc-sa-4.0",
socioeconomic_status="mixed",
annotations_creators="human-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@misc{lef23,
doi = {10.48550/ARXIV.2302.07738},
url = {https://arxiv.org/abs/2302.07738},
Expand All @@ -40,8 +40,8 @@ class AlloprofRetrieval(AbsTaskRetrieval):
year = {2023},
copyright = {Creative Commons Attribution Non Commercial Share Alike 4.0 International}
}""",
n_samples=None,
avg_character_length=None,
n_samples={"train": 2048},
avg_character_length=None, # unable to extract due to invalid hf dataset
)

def load_data(self, **kwargs):
Expand Down
22 changes: 11 additions & 11 deletions mteb/tasks/Retrieval/fra/BSARDRetrieval.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,15 +21,15 @@ class BSARDRetrieval(AbsTaskRetrieval):
eval_splits=["test"],
eval_langs=["fra-Latn"],
main_score="recall_at_100",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
dialect=None,
text_creation=None,
date=("2021-05-01", "2021-08-26"),
form=["spoken"],
domains=["Legal"],
task_subtypes=[],
license="cc-by-nc-sa-4.0",
socioeconomic_status="medium",
annotations_creators="expert-annotated",
dialect=[],
text_creation="found",
bibtex_citation="""@inproceedings{louis2022statutory,
title = {A Statutory Article Retrieval Dataset in French},
author = {Louis, Antoine and Spanakis, Gerasimos},
Expand All @@ -42,8 +42,8 @@ class BSARDRetrieval(AbsTaskRetrieval):
doi = {10.18653/v1/2022.acl-long.468},
pages = {6789–6803},
}""",
n_samples=None,
avg_character_length=None,
n_samples={"test": 222},
avg_character_length={"test": 71.94},
)

def load_data(self, **kwargs):
Expand Down
16 changes: 8 additions & 8 deletions mteb/tasks/Retrieval/fra/SyntecRetrieval.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,15 +23,15 @@ class SyntecRetrieval(AbsTaskRetrieval):
eval_splits=_EVAL_SPLITS,
eval_langs=["fra-Latn"],
main_score="ndcg_at_10",
date=None,
form=None,
domains=None,
task_subtypes=None,
license=None,
socioeconomic_status=None,
annotations_creators=None,
date=None, # not specified
form=["written"],
domains=["Legal"],
task_subtypes=[],
license="not specified.",
socioeconomic_status="high",
annotations_creators="human-annotated",
dialect=[],
text_creation=None,
text_creation="created",
bibtex_citation="""@misc{ciancone2024extending,
title={Extending the Massive Text Embedding Benchmark to French},
author={Mathieu Ciancone and Imene Kerboua and Marion Schaeffer and Wissam Siblini},
Expand Down

0 comments on commit 8823369

Please sign in to comment.