Update app.py
app.py CHANGED
@@ -50,7 +50,7 @@ If you don't know the answer, just say "I do not know." Don't make up an answer.
 llm_model = "TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF"
 # TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF and tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf not working, TinyLlama/TinyLlama-1.1B-Chat-v0.6, andrijdavid/TinyLlama-1.1B-Chat-v1.0-GGUF
 
-tokenizer = AutoTokenizer.from_pretrained("TinyLlama/TinyLlama-1.1B-Chat-v1.0")
+#tokenizer = AutoTokenizer.from_pretrained("TinyLlama/TinyLlama-1.1B-Chat-v1.0")
 #initiate model and tokenizer
 
 #generation_config = AutoConfig.from_pretrained(
@@ -64,21 +64,21 @@ tokenizer = AutoTokenizer.from_pretrained("TinyLlama/TinyLlama-1.1B-Chat-v1.0")
 # eos_token_id=terminators
 #)
 # send additional parameters to model for generation
-terminators = [
-    tokenizer.eos_token_id, # End-of-Sequence token that indicates where the model should consider the text sequence complete
-    tokenizer.convert_tokens_to_ids("<|eot_id|>") # Converts a token string into a single integer id / sequence of ids using the vocabulary
-]
+#terminators = [
+#    tokenizer.eos_token_id, # End-of-Sequence token that indicates where the model should consider the text sequence complete
+#    tokenizer.convert_tokens_to_ids("<|eot_id|>") # Converts a token string into a single integer id / sequence of ids using the vocabulary
+#]
 # indicates the end of a sequence
 
 #model = llama_cpp.Llama(model_path = tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf AutoModelForCausalLM.from_pretrained(llm_model, model_file = "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf", model_type="llama", gpu_layers=0, config = generation_config)
 model = Llama(
     model_path="./tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf",
-
+    # chat_format="llama-2",
     n_gpu_layers = 0,
     temperature=0.75,
     max_tokens=500,
-    top_p=0.95
-
+    top_p=0.95 #,
+    # eos_tokens=terminators
     # callback_manager=callback_manager,
     # verbose=True, # Verbose is required to pass to the callback manager
 )
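For a sense of how the object created by this `Llama(...)` call is typically driven afterwards, here is a minimal sketch using llama-cpp-python's `create_chat_completion`, assuming the sampling settings are passed per generation call and end-of-sequence handling is done with a `stop` string rather than the commented-out `terminators` list; the user question and stop value are illustrative and not taken from app.py.

from llama_cpp import Llama

# Load the quantized GGUF checkpoint on CPU (no layers offloaded to a GPU).
llm = Llama(
    model_path="./tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf",
    chat_format="llama-2",  # template used to serialize the chat messages into a prompt
    n_gpu_layers=0,
)

# Sampling parameters go to the generation call, so the same loaded model
# can be reused with different settings without being re-instantiated.
response = llm.create_chat_completion(
    messages=[
        {"role": "system", "content": "If you don't know the answer, just say 'I do not know.'"},
        {"role": "user", "content": "What is TinyLlama?"},  # illustrative question
    ],
    temperature=0.75,
    top_p=0.95,
    max_tokens=500,
    stop=["</s>"],  # llama.cpp takes stop strings here; tokenizer eos ids are not required
)

print(response["choices"][0]["message"]["content"])

Keeping temperature, top_p, and max_tokens at the call site also sidesteps the question of whether the constructor honors them, which is what the commented-out arguments in the diff appear to be probing.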