Spaces:
Runtime error
Runtime error
FlawedLLM
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -64,13 +64,13 @@ from huggingface_hub import login, HfFolder
|
|
64 |
# model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_9",config=config, ignore_mismatched_sizes=True).to('cuda')
|
65 |
# Load model directly
|
66 |
|
67 |
-
tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/
|
68 |
quantization_config = BitsAndBytesConfig(
|
69 |
load_in_4bit=True,
|
70 |
bnb_4bit_use_double_quant=True,
|
71 |
bnb_4bit_quant_type="nf4",
|
72 |
bnb_4bit_compute_dtype=torch.float16)
|
73 |
-
model = AutoModelForCausalLM.from_pretrained("FlawedLLM/
|
74 |
device_map="auto",
|
75 |
quantization_config=quantization_config,
|
76 |
torch_dtype =torch.float16,
|
|
|
64 |
# model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_9",config=config, ignore_mismatched_sizes=True).to('cuda')
|
65 |
# Load model directly
|
66 |
|
67 |
+
tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini89", trust_remote_code=True)
|
68 |
quantization_config = BitsAndBytesConfig(
|
69 |
load_in_4bit=True,
|
70 |
bnb_4bit_use_double_quant=True,
|
71 |
bnb_4bit_quant_type="nf4",
|
72 |
bnb_4bit_compute_dtype=torch.float16)
|
73 |
+
model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini89",
|
74 |
device_map="auto",
|
75 |
quantization_config=quantization_config,
|
76 |
torch_dtype =torch.float16,
|