Spaces:

Sparticle
/

Llama2_7b_chat_Japanese_Lora

Paused

zhaozitian committed on Aug 9, 2023

Commit

806585b

1 Parent(s): 6357cd4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ assert (
 ), "LLaMA is now in HuggingFace's main branch.\nPlease reinstall it: pip uninstall transformers && pip install git+https://github.com/huggingface/transformers.git"
 from transformers import LlamaTokenizer, LlamaForCausalLM, GenerationConfig
-tokenizer = LlamaTokenizer.from_pretrained("meta-llama/Llama-2-7b-chat-hf")
 BASE_MODEL = "meta-llama/Llama-2-7b-chat-hf"
 LORA_WEIGHTS = "Sparticle/llama-2-7b-japanese-lora"
@@ -30,6 +30,7 @@ if device == "cuda":
         load_in_8bit=False,
         torch_dtype=torch.float16,
         device_map="auto",
     )
     model = PeftModel.from_pretrained(
         model, LORA_WEIGHTS, torch_dtype=torch.float16, force_download=True
@@ -39,6 +40,7 @@ elif device == "mps":
         BASE_MODEL,
         device_map={"": device},
         torch_dtype=torch.float16,
     )
     model = PeftModel.from_pretrained(
         model,

 ), "LLaMA is now in HuggingFace's main branch.\nPlease reinstall it: pip uninstall transformers && pip install git+https://github.com/huggingface/transformers.git"
 from transformers import LlamaTokenizer, LlamaForCausalLM, GenerationConfig
+tokenizer = LlamaTokenizer.from_pretrained("meta-llama/Llama-2-7b-chat-hf", use_auth_token=True)
 BASE_MODEL = "meta-llama/Llama-2-7b-chat-hf"
 LORA_WEIGHTS = "Sparticle/llama-2-7b-japanese-lora"
         load_in_8bit=False,
         torch_dtype=torch.float16,
         device_map="auto",
+        from_pretrained,
     )
     model = PeftModel.from_pretrained(
         model, LORA_WEIGHTS, torch_dtype=torch.float16, force_download=True
         BASE_MODEL,
         device_map={"": device},
         torch_dtype=torch.float16,
+        from_pretrained,
     )
     model = PeftModel.from_pretrained(
         model,