BenBranyon committed on
Commit
5ffc333
·
verified ·
1 Parent(s): 5fb4f11

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -16,7 +16,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
16
  if torch.cuda.is_available():
17
  model_id = "Qwen/Qwen2.5-7B-Instruct"
18
  #model_id = "BenBranyon/sumbot7b-augmented"
19
- model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto")
20
  tokenizer = AutoTokenizer.from_pretrained(model_id, use_fast=True, model_max_length=MAX_INPUT_TOKEN_LENGTH, padding="longest", language="en")
21
 
22
  #Transformers Code
 
16
  if torch.cuda.is_available():
17
  model_id = "Qwen/Qwen2.5-7B-Instruct"
18
  #model_id = "BenBranyon/sumbot7b-augmented"
19
+ model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
20
  tokenizer = AutoTokenizer.from_pretrained(model_id, use_fast=True, model_max_length=MAX_INPUT_TOKEN_LENGTH, padding="longest", language="en")
21
 
22
  #Transformers Code