FlawedLLM committed on
Commit
7a2b2c6
·
verified ·
1 Parent(s): 25f3272

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -0
app.py CHANGED
@@ -6,9 +6,11 @@ import spaces
6
  import gradio as gr
7
  import torch
8
  from transformers import AutoTokenizer, AutoModelForCausalLM
 
9
 
10
  tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")
11
  model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")
 
12
  # alpaca_prompt = You MUST copy from above!
13
  @spaces.GPU(duration=300)
14
  def chunk_it(input_command, item_list):
 
6
import gradio as gr
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

# Tokenizer for the merged 4-bit Gemma checkpoint.
tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_gemma_merged4bit_clean_final")

# BUG FIX: the previous code called bitsandbytes' quantize_blockwise() on the
# whole model. That function quantizes a single tensor and returns a
# (quantized_tensor, QuantState) tuple, so passing an nn.Module raises a
# TypeError -- and rebinding `model` to a tuple would break every later use.
# Request 4-bit weights through transformers' built-in bitsandbytes
# integration at load time instead.
model = AutoModelForCausalLM.from_pretrained(
    "FlawedLLM/Bhashini_gemma_merged4bit_clean_final",
    device_map="auto",   # place layers automatically (GPU when available)
    load_in_4bit=True,   # proper 4-bit quantization via bitsandbytes
)
14
  # alpaca_prompt = You MUST copy from above!
15
  @spaces.GPU(duration=300)
16
  def chunk_it(input_command, item_list):