Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -7,6 +7,7 @@ from threading import Thread
|
|
7 |
from sentence_transformers import SentenceTransformer
|
8 |
import faiss
|
9 |
import fitz # PyMuPDF
|
|
|
10 |
|
11 |
# 환경 변수에서 Hugging Face 토큰 가져오기
|
12 |
token = os.environ.get("HF_TOKEN")
|
@@ -45,7 +46,7 @@ data = data.map(lambda x: {"question_embedding": ST.encode(x["question"])}, batc
|
|
45 |
data.add_faiss_index(column="question_embedding")
|
46 |
|
47 |
# LLaMA 모델 설정
|
48 |
-
model_id = "
|
49 |
bnb_config = BitsAndBytesConfig(
|
50 |
load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
|
51 |
)
|
|
|
7 |
from sentence_transformers import SentenceTransformer
|
8 |
import faiss
|
9 |
import fitz # PyMuPDF
|
10 |
+
import torchvision
|
11 |
|
12 |
# 환경 변수에서 Hugging Face 토큰 가져오기
|
13 |
token = os.environ.get("HF_TOKEN")
|
|
|
46 |
data.add_faiss_index(column="question_embedding")
|
47 |
|
48 |
# LLaMA 모델 설정
|
49 |
+
model_id = "MLP-KTLim/llama-3-Korean-Bllossom-8B"
|
50 |
bnb_config = BitsAndBytesConfig(
|
51 |
load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
|
52 |
)
|