plutus-8B-instruct

Running

jiminHuang committed on Feb 18

Commit

4c52fb0

verified ·

1 Parent(s): 4922032

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,11 +8,10 @@ import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
 DESCRIPTION = """\
-# Llama 3.2 3B Instruct
-Llama 3.2 3B is Meta's latest iteration of open LLMs.
-This is a demo of [`meta-llama/Llama-3.2-3B-Instruct`](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct), fine-tuned for instruction following.
-For more details, please check [our post](https://huggingface.co/blog/llama32).
 """
 MAX_MAX_NEW_TOKENS = 2048
@@ -21,7 +20,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
-model_id = "meta-llama/Llama-3.2-3B-Instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,

 from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
 DESCRIPTION = """\
+# Plutus 8B instruct
+Plutus 8B is The Fin AI's latest iteration of open LLMs.
+This is a demo of [`TheFinAI/plutus-8B-instruct`](https://huggingface.co/TheFinAI/plutus-8B-instruct), fine-tuned for instruction following.
 """
 MAX_MAX_NEW_TOKENS = 2048
 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+model_id = "TheFinAI/plutus-8B-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,