Spaces:

Harsh2001
/

Israel-Hamas-War-Knowledge

Sleeping

Harsh2001 committed on Jun 8, 2024

Commit

185e9a0

verified ·

1 Parent(s): a92113b

Update utils.py

Files changed (1) hide show

utils.py CHANGED Viewed

@@ -14,17 +14,10 @@ from transformers import StoppingCriteria, StoppingCriteriaList
 hf_auth = os.getenv('hf_auth')
 # LLM Model
-model_id = 'meta-llama/Llama-2-7b-chat-hf'
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
-bnb_config = transformers.BitsAndBytesConfig(
-    load_in_4bit=True,
-    bnb_4bit_quant_type='nf4',
-    bnb_4bit_use_double_quant=True,
-    bnb_4bit_compute_dtype=bfloat16
-)
 model_config = transformers.AutoConfig.from_pretrained(
     model_id,
     use_auth_token=hf_auth
@@ -34,7 +27,6 @@ llm_model = transformers.AutoModelForCausalLM.from_pretrained(
     model_id,
     trust_remote_code=True,
     config=model_config,
-    quantization_config=bnb_config,
     device_map='auto',
     use_auth_token=hf_auth
 )

 hf_auth = os.getenv('hf_auth')
 # LLM Model
+model_id = 'google-t5/t5-base'
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 model_config = transformers.AutoConfig.from_pretrained(
     model_id,
     use_auth_token=hf_auth
     model_id,
     trust_remote_code=True,
     config=model_config,
     device_map='auto',
     use_auth_token=hf_auth
 )