hienbm committed on
Commit
5dc4a5d
·
verified ·
1 Parent(s): 0d265f0

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -32,7 +32,7 @@ api_token = os.getenv("API_TOKEN")
32
 
33
  os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:15000"
34
 
35
- model_id = "google/gemma-2-9b-it"
36
  quantization_config = BitsAndBytesConfig(load_in_4bit=True)
37
 
38
  tokenizer = AutoTokenizer.from_pretrained(
 
32
 
33
  os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:15000"
34
 
35
+ model_id = "mistralai/Mixtral-8x7B-Instruct-v0.1"
36
  quantization_config = BitsAndBytesConfig(load_in_4bit=True)
37
 
38
  tokenizer = AutoTokenizer.from_pretrained(