Spaces:

shenzhi-wang
/

Gemma-2-27B-Chinese-Chat

Runtime error

shenzhi-wang committed on Jul 3, 2024

Commit

733ec1d

1 Parent(s): df32955

[fix] load in 16 bit

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,7 +45,7 @@ CSS = """
 tokenizer = AutoTokenizer.from_pretrained("shenzhi-wang/Gemma-2-27B-Chinese-Chat")
-model = AutoModelForCausalLM.from_pretrained("shenzhi-wang/Gemma-2-27B-Chinese-Chat", device_map="auto")
 @spaces.GPU
@@ -127,4 +127,4 @@ with gr.Blocks(css=CSS) as demo:
 if __name__ == "__main__":
-    demo.launch()

 tokenizer = AutoTokenizer.from_pretrained("shenzhi-wang/Gemma-2-27B-Chinese-Chat")
+model = AutoModelForCausalLM.from_pretrained("shenzhi-wang/Gemma-2-27B-Chinese-Chat", device_map="auto", torch_dtype="auto")
 @spaces.GPU
 if __name__ == "__main__":
+    demo.launch()