matching_embedding / datadreamer.json
AjayP13's picture
Pushed by DataDreamer
997fe8b verified
{
"model_card": {
"Date & Time": "2025-03-06T21:12:29.381066",
"Model Card": [
"https://huggingface.co/BAAI/bge-m3"
],
"License Information": [
"mit"
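],
"Citation Information": [
"\n@inproceedings{Wolf_Transformers_State-of-the-Art_Natural_2020,\n author = {Wolf, Thomas and Debut, Lysandre and Sanh, Victor and Chaumond, Julien and Delangue, Clement and Moi, Anthony and Cistac, Pierric and Ma, Clara and Jernite, Yacine and Plu, Julien and Xu, Canwen and Le Scao, Teven and Gugger, Sylvain and Drame, Mariama and Lhoest, Quentin and Rush, Alexander M.},\n month = oct,\n pages = {38--45},\n publisher = {Association for Computational Linguistics},\n title = {{Transformers: State-of-the-Art Natural Language Processing}},\n url = {https://www.aclweb.org/anthology/2020.emnlp-demos.6},\n year = {2020}\n}",
"\n@Misc{peft,\n title = {PEFT: State-of-the-art Parameter-Efficient Fine-Tuning methods},\n author = {Sourab Mangrulkar and Sylvain Gugger and Lysandre Debut and Younes Belkada and Sayak Paul and Benjamin Bossan},\n howpublished = {\\url{https://github.com/huggingface/peft}},\n year = {2022}\n}",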
"@misc{bge-m3,\n title={BGE M3-Embedding: Multi-Lingual, Multi-Functionality, Multi-Granularity Text Embeddings Through Self-Knowledge Distillation}, \n author={Jianlv Chen and Shitao Xiao and Peitian Zhang and Kun Luo and Defu Lian and Zheng Liu},\n year={2024},\n eprint={2402.03216},\n archivePrefix={arXiv},\n primaryClass={cs.CL}\n}",
"@inproceedings{reimers-2019-sentence-bert,\n title = \"Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks\",\n author = \"Reimers, Nils and Gurevych, Iryna\",\n booktitle = \"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing\",\n month = \"11\",\n year = \"2019\",\n publisher = \"Association for Computational Linguistics\",\n url = \"https://arxiv.org/abs/1908.10084\",\n}"
]
},
"data_card": {
"Get Matching Calibration": {
"Date & Time": "2025-03-05T12:33:06.921999",
"Dataset Name": [
"fineinstructions/matching_calibration"
],
"Dataset Card": [
"https://huggingface.co/datasets/fineinstructions/matching_calibration"
]
},
"Adjust sims for hard positives and negatives": {
"Date & Time": "2025-03-05T12:35:51.663481"
},
"Filter out too long rows": {
"Date & Time": "2025-03-05T12:37:19.256235"
},
"Filter out too long rows (train split)": {
"Date & Time": "2025-03-05T12:40:43.387535"
}
},
"__version__": "0.46.0",
"datetime": "2025-03-06T20:29:33.338084",
"type": "TrainSentenceTransformer",
"name": "Train Matching Embedding",
"version": 1.0,
"fingerprint": "66bfe8a08b39004c",
"req_versions": {
"dill": "0.3.8",
"sqlitedict": "2.1.0",
"torch": "2.5.1",
"numpy": "1.26.4",
"transformers": "4.48.2",
"datasets": "3.2.0",
"huggingface_hub": "0.27.1",
"accelerate": "1.3.0",
"peft": "0.14.0",
"tiktoken": "0.7.0",
"tokenizers": "0.21.0",
"openai": "1.59.8",
"ctransformers": "0.2.27",
"optimum": "1.23.3",
"bitsandbytes": "0.45.0",
"litellm": "1.57.8",
"trl": "0.9.6",
"setfit": "1.1.1",
"vllm": "0.7.0"
},
"interpreter": "3.11.1 (main, Apr 12 2023, 13:34:00) [GCC 7.5.0]"
}