Namitg02 committed on
Commit
357e5f2
·
verified ·
1 Parent(s): 5e67599

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -4
app.py CHANGED
@@ -41,14 +41,13 @@ embedding_model = SentenceTransformer("mixedbread-ai/mxbai-embed-large-v1")
41
  #all-MiniLM-L6-v2, BAAI/bge-base-en-v1.5,infgrad/stella-base-en-v2, BAAI/bge-large-en-v1.5 working with default dimensions
42
  #docs_text = [doc.text for doc in docs]
43
  #embed = embedding_model.embed_documents(docs_text)
44
- #embeddings = embedding_model.encode(docs)
45
- embeddings = torch.from_numpy(dataset["train"].to_pandas().to_numpy()).to(torch.float)
46
-
47
 
 
48
 
49
  #doc_func = lambda x: x.text
50
  #dataset = list(map(doc_func, dataset))
51
- #embeddings = embedding_model.embed_documents(dataset)
 
52
  #embeddings = embedding_model.embed_documents(docs)
53
  dataset = dataset.add_column('embeddings', embeddings)
54
  embedding_dim = embedding_model.get_sentence_embedding_dimension()
 
41
  #all-MiniLM-L6-v2, BAAI/bge-base-en-v1.5,infgrad/stella-base-en-v2, BAAI/bge-large-en-v1.5 working with default dimensions
42
  #docs_text = [doc.text for doc in docs]
43
  #embed = embedding_model.embed_documents(docs_text)
 
 
 
44
 
45
+ #embeddings = embedding_model.encode(docs)
46
 
47
  #doc_func = lambda x: x.text
48
  #dataset = list(map(doc_func, dataset))
49
+ embeddings = embedding_model.embed_documents(dataset[text])
50
+
51
  #embeddings = embedding_model.embed_documents(docs)
52
  dataset = dataset.add_column('embeddings', embeddings)
53
  embedding_dim = embedding_model.get_sentence_embedding_dimension()