Spaces:
Sleeping
Sleeping
ddovidovich
committed on
Commit
·
6ecdc04
1
Parent(s):
2714936
Update app.py
Browse files
app.py
CHANGED
@@ -3,7 +3,9 @@ import streamlit as st
|
|
3 |
import pandas as pd
|
4 |
import numpy as np
|
5 |
from tqdm.auto import tqdm
|
6 |
-
from sentence_transformers import SentenceTransformer
|
|
|
|
|
7 |
|
8 |
dataList = [
|
9 |
{"Answer": "", "Distance": 0},
|
@@ -27,9 +29,12 @@ def load_documents_from_jsonl(embeddings_model, jsonl_path, createEmbeddings=Fal
|
|
27 |
|
28 |
return df
|
29 |
|
30 |
-
def generate_embeddings(model, text):
|
|
|
|
|
|
|
31 |
with torch.no_grad():
|
32 |
-
embeddings = model
|
33 |
return embeddings.cpu().numpy()
|
34 |
|
35 |
def save_to_faiss(df):
|
@@ -56,7 +61,9 @@ def main():
|
|
56 |
# Заголовок приложения
|
57 |
st.title("Demo for LLAMA-2 RAG with CPU only")
|
58 |
|
59 |
-
model = SentenceTransformer('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
|
|
|
|
|
60 |
|
61 |
df_qa = load_documents_from_jsonl('ExportForAI1.jsonl', model, False)
|
62 |
save_to_faiss(df_qa)
|
|
|
3 |
import pandas as pd
|
4 |
import numpy as np
|
5 |
from tqdm.auto import tqdm
|
6 |
+
#from sentence_transformers import SentenceTransformer
|
7 |
+
from transformers import AutoTokenizer, AutoModel
|
8 |
+
import torch
|
9 |
|
10 |
dataList = [
|
11 |
{"Answer": "", "Distance": 0},
|
|
|
29 |
|
30 |
return df
|
31 |
|
32 |
+
def generate_embeddings(tokenizer, model, text):
    """Return a sentence embedding for ``text`` as a NumPy array.

    The text is tokenized, run through ``model`` without gradient tracking,
    and the per-token hidden states are mean-pooled using the attention mask
    so that padding tokens do not contribute to the average.

    Args:
        tokenizer: Callable invoked as
            ``tokenizer(text, padding=True, truncation=True,
            return_tensors='pt')``; its result must provide an
            ``'attention_mask'`` entry and be unpackable with ``**``.
        model: Callable invoked as ``model(**encoded_input)``; its result
            must expose ``last_hidden_state``.
        text: A single string or a list of strings.

    Returns:
        A NumPy array: one row per input when ``text`` is a list, or a
        single 1-D vector when ``text`` is a plain string.
    """
    encoded_input = tokenizer(text, padding=True, truncation=True, return_tensors='pt')
    with torch.no_grad():
        model_output = model(**encoded_input)
        # The forward pass returns an output object, not a tensor, so the
        # token-level states have to be pulled out and pooled explicitly.
        # assumes last_hidden_state is (batch, tokens, hidden) - TODO confirm
        token_embeddings = model_output.last_hidden_state
        mask = encoded_input['attention_mask'].unsqueeze(-1).to(token_embeddings.dtype)
        summed = (token_embeddings * mask).sum(dim=1)
        # Clamp so an all-padding row cannot cause a division by zero.
        counts = mask.sum(dim=1).clamp(min=1e-9)
        embeddings = summed / counts
    # NOTE(review): a lone string yields a 1-D vector to mirror the
    # previous `model.encode(text, ...)` call - confirm callers expect this.
    if isinstance(text, str):
        embeddings = embeddings[0]
    return embeddings.cpu().numpy()
|
39 |
|
40 |
def save_to_faiss(df):
|
|
|
61 |
# Заголовок приложения
|
62 |
st.title("Demo for LLAMA-2 RAG with CPU only")
|
63 |
|
64 |
+
#model = SentenceTransformer('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
|
65 |
+
tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
|
66 |
+
model = AutoModel.from_pretrained('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
|
67 |
|
68 |
df_qa = load_documents_from_jsonl('ExportForAI1.jsonl', model, False)
|
69 |
save_to_faiss(df_qa)
|