FlawedLLM committed on
Commit bc816b1 · verified · 1 Parent(s): 84092dc

Update app.py

Files changed (1): app.py +2 -1
app.py CHANGED
@@ -13,7 +13,8 @@ tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_c
 model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")
 def quantize_model(model):
     for name, module in model.named_modules():
-        if isinstance(module, torch.nn.Linear) and not isinstance(module, torch.nn.Linear4bit):
+        # Quantize only Linear layers that haven't already been quantized
+        if isinstance(module, torch.nn.Linear) and not isinstance(module, Linear4bit):
             module = quantize_blockwise(module)
 
 # Quantize the model (modified)
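
For context, here is a minimal, self-contained sketch of the pattern the fixed line relies on. `bitsandbytes.nn.Linear4bit` and `bitsandbytes.functional.quantize_blockwise` are real bitsandbytes APIs (and `Linear4bit` subclasses `torch.nn.Linear`, which is why the double isinstance check is needed), but the helper name `quantize_linear_weights` and the surrounding loop are illustrative assumptions, not the app's exact code:

import torch
import bitsandbytes as bnb
from bitsandbytes.nn import Linear4bit  # the name the patched line expects in scope

def quantize_linear_weights(model: torch.nn.Module):
    """Illustrative helper (not from app.py): blockwise-quantize the weights
    of plain Linear layers, skipping layers that are already 4-bit."""
    quantized = {}
    for name, module in model.named_modules():
        # Same guard as the patched line: only plain torch.nn.Linear,
        # never an already-quantized bitsandbytes Linear4bit.
        if isinstance(module, torch.nn.Linear) and not isinstance(module, Linear4bit):
            # quantize_blockwise operates on tensors, so quantize the weight;
            # it returns the packed tensor plus the state needed to dequantize.
            packed, state = bnb.functional.quantize_blockwise(module.weight.data)
            quantized[name] = (packed, state)
    return quantized

One design note on the sketch: because `quantize_blockwise` works on tensors and returns a `(packed, quant_state)` pair, the helper collects those results in a dict rather than rebinding the loop variable, since rebinding `module` inside `named_modules()` does not replace the layer held by the model.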