cfli committed on
Commit
bd67852
·
verified ·
1 Parent(s): 33a79d7

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. README.md +8 -23
  2. sentence_bert_config.json +1 -1
README.md CHANGED
@@ -201,28 +201,13 @@ print(scores.tolist())
201
  If you find this repository useful, please consider giving a star :star: and citation
202
 
203
  ```
204
- @article{bge-llm,
205
- title={Making text embedders few-shot learners},
206
- author={Li, Chaofan and Qin, MingHao and Xiao, Shitao and Chen, Jianlyu and Luo, Kun and Shao, Yingxia and Lian, Defu and Liu, Zheng},
207
- journal={arXiv preprint arXiv:2409.15700},
208
- year={2024}
209
- }
210
-
211
- @misc{bge-m3,
212
- title={BGE M3-Embedding: Multi-Lingual, Multi-Functionality, Multi-Granularity Text Embeddings Through Self-Knowledge Distillation},
213
- author={Jianlv Chen and Shitao Xiao and Peitian Zhang and Kun Luo and Defu Lian and Zheng Liu},
214
- year={2024},
215
- eprint={2402.03216},
216
- archivePrefix={arXiv},
217
- primaryClass={cs.CL}
218
- }
219
-
220
- @misc{bge_embedding,
221
- title={C-Pack: Packaged Resources To Advance General Chinese Embedding},
222
- author={Shitao Xiao and Zheng Liu and Peitian Zhang and Niklas Muennighoff},
223
- year={2023},
224
- eprint={2309.07597},
225
- archivePrefix={arXiv},
226
- primaryClass={cs.CL}
227
  }
228
  ```
 
201
  If you find this repository useful, please consider giving a star :star: and citation
202
 
203
  ```
204
+ @misc{bge_code,
205
+ title={Towards A Generalist Code Embedding Model Based On Massive Data Synthesis},
206
+ author={Chaofan Li and Jianlyu Chen and Yingxia Shao and Defu Lian and Zheng Liu},
207
+ year={2025},
208
+ eprint={2505.12697},
209
+ archivePrefix={arXiv},
210
+ primaryClass={cs.IR},
211
+ url={https://arxiv.org/abs/2505.12697},
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  }
213
  ```
sentence_bert_config.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "max_seq_length": 256,
3
  "do_lower_case": false
4
  }
 
1
  {
2
+ "max_seq_length": 32768,
3
  "do_lower_case": false
4
  }