rajj0 committed on
Commit
aed121c
·
verified ·
1 Parent(s): a0fbc1b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -6
app.py CHANGED
@@ -11,11 +11,7 @@ import spaces
11
  import time
12
  import subprocess
13
 
14
- subprocess.run(
15
- "pip install flash-attn --no-build-isolation",
16
- env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
17
- shell=True,
18
- )
19
 
20
  token = os.environ["HF_TOKEN"]
21
 
@@ -58,7 +54,7 @@ def chat(message, history, temperature, do_sample, max_tokens):
58
  model_inputs,
59
  streamer=streamer,
60
  max_new_tokens=max_tokens,
61
- do_sample=True,
62
  temperature=temperature,
63
  eos_token_id=terminators,
64
  )
 
11
  import time
12
  import subprocess
13
 
14
+
 
 
 
 
15
 
16
  token = os.environ["HF_TOKEN"]
17
 
 
54
  model_inputs,
55
  streamer=streamer,
56
  max_new_tokens=max_tokens,
57
+ do_sample=True,r
58
  temperature=temperature,
59
  eos_token_id=terminators,
60
  )