sablab committed on
Commit
4f3af9f
·
verified ·
1 Parent(s): 66f2856

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -2
app.py CHANGED
@@ -14,7 +14,13 @@ def format_prompt(message, history):
14
  prompt += f"[INST] {message} [/INST]"
15
  return prompt
16
 
17
- def generate(prompt, history, temperature=0.9, max_new_tokens=16000, top_p=0.95, repetition_penalty=1.0,):
 
 
 
 
 
 
18
  generate_kwargs = dict(
19
  temperature=temperature,
20
  max_new_tokens=max_new_tokens,
@@ -22,7 +28,8 @@ def generate(prompt, history, temperature=0.9, max_new_tokens=16000, top_p=0.95,
22
  repetition_penalty=repetition_penalty,
23
  do_sample=True,
24
  seed=42,)
25
- formatted_prompt = format_prompt(prompt, history)
 
26
  stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
27
  output = ""
28
 
 
14
  prompt += f"[INST] {message} [/INST]"
15
  return prompt
16
 
17
+ def generate(prompt, history, system_prompt, temperature=0.9, max_new_tokens=16000, top_p=0.95, repetition_penalty=1.0,):
18
+
19
+ temperature = float(temperature)
20
+ if temperature < 1e-2:
21
+ temperature = 1e-2
22
+ top_p = float(top_p)
23
+
24
  generate_kwargs = dict(
25
  temperature=temperature,
26
  max_new_tokens=max_new_tokens,
 
28
  repetition_penalty=repetition_penalty,
29
  do_sample=True,
30
  seed=42,)
31
+
32
+ formatted_prompt = format_prompt(f"{system_prompt}, {prompt}", history)
33
  stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
34
  output = ""
35