Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -58,10 +58,10 @@ def generate(
|
|
58 |
message: str,
|
59 |
chat_history: list[tuple[str, str]],
|
60 |
max_new_tokens: int = 1024,
|
61 |
-
|
62 |
-
|
63 |
-
|
64 |
-
|
65 |
) -> Iterator[str]:
|
66 |
conversation = []
|
67 |
for user, assistant in chat_history:
|
@@ -83,11 +83,11 @@ def generate(
|
|
83 |
streamer=streamer,
|
84 |
max_new_tokens=max_new_tokens,
|
85 |
do_sample=True,
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
num_beams=1,
|
90 |
-
|
91 |
)
|
92 |
t = Thread(target=model.generate, kwargs=generate_kwargs)
|
93 |
t.start()
|
|
|
58 |
message: str,
|
59 |
chat_history: list[tuple[str, str]],
|
60 |
max_new_tokens: int = 1024,
|
61 |
+
temperature: float = 0.6,
|
62 |
+
top_p: float = 0.9,
|
63 |
+
top_k: int = 40,
|
64 |
+
repetition_penalty: float = 1.0,
|
65 |
) -> Iterator[str]:
|
66 |
conversation = []
|
67 |
for user, assistant in chat_history:
|
|
|
83 |
streamer=streamer,
|
84 |
max_new_tokens=max_new_tokens,
|
85 |
do_sample=True,
|
86 |
+
top_p=top_p,
|
87 |
+
top_k=top_k,
|
88 |
+
temperature=temperature,
|
89 |
num_beams=1,
|
90 |
+
repetition_penalty=repetition_penalty,
|
91 |
)
|
92 |
t = Thread(target=model.generate, kwargs=generate_kwargs)
|
93 |
t.start()
|