praeclarumjj3 committed on
Commit
e01bde8
·
verified ·
1 Parent(s): f4b0271

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -0
app.py CHANGED
@@ -14,6 +14,14 @@ from vcoder_llava.utils import (build_logger, server_error_msg,
14
  violates_moderation, moderation_msg)
15
  from chat import Chat
16
 
 
 
 
 
 
 
 
 
17
 
18
  logger = build_logger("gradio_app", "gradio_web_server.log")
19
 
 
14
  violates_moderation, moderation_msg)
15
  from chat import Chat
16
 
17
+ import subprocess
18
+ # Install flash attention, skipping CUDA build if necessary
19
+ subprocess.run(
20
+ "pip install flash-attn --no-build-isolation",
21
+ env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
22
+ shell=True,
23
+ )
24
+
25
 
26
  logger = build_logger("gradio_app", "gradio_web_server.log")
27