BhashiniSpace_Text_gemma

Runtime error

FlawedLLM committed on May 22, 2024

Commit

731e7a8

verified ·

1 Parent(s): d2a5fcd

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -60,12 +60,11 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 # # torch_dtype =torch.float16
 # model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_9",config=config, ignore_mismatched_sizes=True).to('cuda')
 # Load model directly
-@spaces.GPU(duration=300)
 tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_00")
 model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_00", load_in_4bit=True).to('cuda')
 def chunk_it(input_command):
     alpaca_prompt = """Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.

 # # torch_dtype =torch.float16
 # model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_9",config=config, ignore_mismatched_sizes=True).to('cuda')
 # Load model directly
 tokenizer = AutoTokenizer.from_pretrained("FlawedLLM/Bhashini_00")
 model = AutoModelForCausalLM.from_pretrained("FlawedLLM/Bhashini_00", load_in_4bit=True).to('cuda')
+@spaces.GPU(duration=300)
 def chunk_it(input_command):
     alpaca_prompt = """Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.