TenzinGayche committed on
Commit
ba9d175
·
verified ·
1 Parent(s): 2457882

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -16,8 +16,8 @@ DEFAULT_MAX_NEW_TOKENS = 1024
16
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
17
 
18
  # Load the model and tokenizer
19
- tokenizer = GemmaTokenizerFast.from_pretrained("TenzinGayche/example_v1.0.2")
20
- model = AutoModelForCausalLM.from_pretrained("TenzinGayche/example_v1.0.2", torch_dtype=torch.float16).to("cuda")
21
 
22
  model.config.sliding_window = 4096
23
  model.eval()
 
16
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
17
 
18
  # Load the model and tokenizer
19
+ tokenizer = GemmaTokenizerFast.from_pretrained("TenzinGayche/ft_final")
20
+ model = AutoModelForCausalLM.from_pretrained("TenzinGayche/ft_final", torch_dtype=torch.float16).to("cuda")
21
 
22
  model.config.sliding_window = 4096
23
  model.eval()