Update README.md
Browse files
README.md
CHANGED
@@ -75,7 +75,7 @@ llm = Llama.from_pretrained(
|
|
75 |
chat_history = [
|
76 |
{"role": "system", "content": """
|
77 |
You are a helpful assistant named Llama, made by Meta AI.
|
78 |
-
Always use your <|reasoning|> <|end_reasoning|> tokens, without any text formatting, plain text only.
|
79 |
"""}
|
80 |
]
|
81 |
|
@@ -93,7 +93,7 @@ while True:
|
|
93 |
# Call the chat completion API in streaming mode with the updated conversation.
|
94 |
output_stream = llm.create_chat_completion(
|
95 |
messages=chat_history,
|
96 |
-
temperature=0.
|
97 |
top_p=0.95,
|
98 |
max_tokens=4096,
|
99 |
stream=True
|
|
|
75 |
chat_history = [
|
76 |
{"role": "system", "content": """
|
77 |
You are a helpful assistant named Llama, made by Meta AI.
|
78 |
+
Always use your <|reasoning|> and <|end_reasoning|> tokens, without any text formatting, plain text only.
|
79 |
"""}
|
80 |
]
|
81 |
|
|
|
93 |
# Call the chat completion API in streaming mode with the updated conversation.
|
94 |
output_stream = llm.create_chat_completion(
|
95 |
messages=chat_history,
|
96 |
+
temperature=0.4,
|
97 |
top_p=0.95,
|
98 |
max_tokens=4096,
|
99 |
stream=True
|