Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -32,7 +32,7 @@ import gradio as gr # Gradio 임포트 추가
|
|
32 |
print("Vector DB์ ์๋ฒ ๋ฉ ๋ชจ๋ธ์ ๋ถ๋ฌ์ค๋ ์ค์
๋๋ค...")
|
33 |
index_path = "proj2_voca"
|
34 |
model_name = "jhgan/ko-sroberta-multitask"
|
35 |
-
model_kwargs = {'device': '
|
36 |
encode_kwargs = {'normalize_embeddings': True}
|
37 |
embeddings = HuggingFaceEmbeddings(
|
38 |
model_name=model_name,
|
@@ -50,7 +50,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
50 |
model_id,
|
51 |
torch_dtype=torch.bfloat16,
|
52 |
device_map=None # 자동 배치 비활성화
|
53 |
-
).to("
|
54 |
|
55 |
# --- 2. 언어 모델(LLM) 불러오기 ---
|
56 |
# ... (이전 코드 생략) ...
|
@@ -58,7 +58,7 @@ pipe = pipeline(
|
|
58 |
"text-generation",
|
59 |
model=model,
|
60 |
tokenizer=tokenizer,
|
61 |
-
device
|
62 |
max_new_tokens=170, # 최대 생성 토큰 수 감소
|
63 |
temperature=0.7,
|
64 |
repetition_penalty=1.2, # 반복 방지 패널티 추가
|
|
|
32 |
print("Vector DB์ ์๋ฒ ๋ฉ ๋ชจ๋ธ์ ๋ถ๋ฌ์ค๋ ์ค์
๋๋ค...")
|
33 |
index_path = "proj2_voca"
|
34 |
model_name = "jhgan/ko-sroberta-multitask"
|
35 |
+
model_kwargs = {'device': 'cpu'}
|
36 |
encode_kwargs = {'normalize_embeddings': True}
|
37 |
embeddings = HuggingFaceEmbeddings(
|
38 |
model_name=model_name,
|
|
|
50 |
model_id,
|
51 |
torch_dtype=torch.bfloat16,
|
52 |
device_map=None # 자동 배치 비활성화
|
53 |
+
).to("cpu") # GPU 번호 명시
|
54 |
|
55 |
# --- 2. 언어 모델(LLM) 불러오기 ---
|
56 |
# ... (이전 코드 생략) ...
|
|
|
58 |
"text-generation",
|
59 |
model=model,
|
60 |
tokenizer=tokenizer,
|
61 |
+
device=-1,
|
62 |
max_new_tokens=170, # 최대 생성 토큰 수 감소
|
63 |
temperature=0.7,
|
64 |
repetition_penalty=1.2, # 반복 방지 패널티 추가
|