Sharaf Zaman committed on
Commit
2bc10cc
·
1 Parent(s): dc169a4

Try v3 (Get rid of LoRA stuff)

Browse files
Files changed (1) hide show
  1. app.py +3 -5
app.py CHANGED
@@ -34,7 +34,7 @@ def start_worker(model_path: str, bits=16):
34
  assert bits in [4, 8, 16], "It can be only loaded with 16-bit, 8-bit, and 4-bit."
35
  if bits != 16:
36
  model_name += f"-{bits}bit"
37
- model_name += "-lora"
38
  worker_command = [
39
  sys.executable,
40
  "-m",
@@ -47,8 +47,6 @@ def start_worker(model_path: str, bits=16):
47
  model_path,
48
  "--model-name",
49
  model_name,
50
- "--model-base",
51
- "liuhaotian/llava-1.5-7b",
52
  "--use-flash-attn",
53
  ]
54
  # if bits != 16:
@@ -74,8 +72,8 @@ if __name__ == "__main__":
74
 
75
  print(f"astro args: {gws.args}")
76
 
77
- model_path = os.getenv("model", "universeTBD/AstroLLaVA_v2")
78
- bits = int(os.getenv("bits", 4))
79
  concurrency_count = int(os.getenv("concurrency_count", 5))
80
 
81
  controller_proc = start_controller()
 
34
  assert bits in [4, 8, 16], "It can be only loaded with 16-bit, 8-bit, and 4-bit."
35
  if bits != 16:
36
  model_name += f"-{bits}bit"
37
+ # model_name += "-lora"
38
  worker_command = [
39
  sys.executable,
40
  "-m",
 
47
  model_path,
48
  "--model-name",
49
  model_name,
 
 
50
  "--use-flash-attn",
51
  ]
52
  # if bits != 16:
 
72
 
73
  print(f"astro args: {gws.args}")
74
 
75
+ model_path = os.getenv("model", "universeTBD/AstroLLaVA_v3")
76
+ bits = int(os.getenv("bits", 16))
77
  concurrency_count = int(os.getenv("concurrency_count", 5))
78
 
79
  controller_proc = start_controller()