Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -682,7 +682,7 @@ def stream_chat(
     print(f"입력 텐서 생성 후 CUDA 메모리: {torch.cuda.memory_allocated() / 1024**2:.2f} MB")
 
     streamer = TextIteratorStreamer(
-        tokenizer, timeout=
+        tokenizer, timeout=30., skip_prompt=True, skip_special_tokens=True
     )
 
     generate_kwargs = dict(