File size: 886 Bytes
094f515
ffc7b61
094f515
 
 
 
 
 
 
 
 
 
25830df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
094f515
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
from langchain.embeddings import HuggingFaceEmbeddings
import torch

def get_hf_embeddings(model_name=None):
    """Build a HuggingFaceEmbeddings instance for the requested model.

    Args:
        model_name: Hugging Face model identifier. When None, the default
            "BAAI/bge-base-en-v1.5" is used.

    Returns:
        The constructed HuggingFaceEmbeddings object.
    """
    # Another candidate noted by the original author:
    # "sentence-transformers/all-mpnet-base-v2"
    chosen_model = "BAAI/bge-base-en-v1.5" if model_name is None else model_name
    return HuggingFaceEmbeddings(model_name=chosen_model)

def get_SFR_Code_embedding_model(
    model_name="Salesforce/SFR-Embedding-Code-400M_R", device="auto"
):
    """Return a HuggingFaceEmbeddings wrapper for an SFR code-embedding model.

    Args:
        model_name: Hugging Face model identifier. Defaults to
            "Salesforce/SFR-Embedding-Code-400M_R".
        device: Device string forwarded to the model via ``model_kwargs``
            (e.g. "cpu" or "cuda"). The special value "auto" picks "cuda"
            when ``torch.cuda.is_available()`` is true, otherwise "cpu".

    Returns:
        The constructed HuggingFaceEmbeddings object.
    """
    # Resolve the "auto" placeholder to a concrete device.
    if device == "auto":
        device = "cuda" if torch.cuda.is_available() else "cpu"

    # NOTE(review): trust_remote_code=True allows Python code shipped in the
    # model repository to run at load time; only pass model names you trust.
    model_kwargs = {"device": device, "trust_remote_code": True}

    return HuggingFaceEmbeddings(
        model_name=model_name,
        model_kwargs=model_kwargs,
    )