webpluging

Paused

ranamhamoud committed on Apr 18, 2024

Commit

89044b5

verified ·

1 Parent(s): 4d5d8af

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -26,18 +26,18 @@ if not torch.cuda.is_available():
 if torch.cuda.is_available():
-# Model and Tokenizer Configuration
-model_id = "meta-llama/Llama-2-7b-chat-hf"
-bnb_config = BitsAndBytesConfig(
-    load_in_4bit=True,
-    bnb_4bit_use_double_quant=False,
-    bnb_4bit_quant_type="nf4",
-    bnb_4bit_compute_dtype=torch.bfloat16
-)
-base_model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", quantization_config=bnb_config)
-model = PeftModel.from_pretrained(base_model, "ranamhamoud/storytell")
-tokenizer = AutoTokenizer.from_pretrained(model_id)
-tokenizer.pad_token = tokenizer.eos_token
 # # MongoDB Connection
 # PASSWORD = os.environ.get("MONGO_PASS")

 if torch.cuda.is_available():
+    # Model and Tokenizer Configuration
+    model_id = "meta-llama/Llama-2-7b-chat-hf"
+    bnb_config = BitsAndBytesConfig(
+        load_in_4bit=True,
+        bnb_4bit_use_double_quant=False,
+        bnb_4bit_quant_type="nf4",
+        bnb_4bit_compute_dtype=torch.bfloat16
+    )
+    base_model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", quantization_config=bnb_config)
+    model = PeftModel.from_pretrained(base_model, "ranamhamoud/storytell")
+    tokenizer = AutoTokenizer.from_pretrained(model_id)
+    tokenizer.pad_token = tokenizer.eos_token
 # # MongoDB Connection
 # PASSWORD = os.environ.get("MONGO_PASS")