PMAlpha / hippocampus.py
Sergidev's picture
v1
f1eb360 verified
raw
history blame
562 Bytes
from llama_cpp import Llama
def generate_topic(prompt: str, response: str) -> str:
    """Generate a short topic label for one user/assistant exchange.

    The exchange is embedded in an instruction prompt ending in ``Topic:``
    and completed by a local GGUF model through ``llama_cpp.Llama``.
    Generation ends at the first newline or after 10 tokens, whichever
    comes first.

    Args:
        prompt: The user's message.
        response: The assistant's reply to that message.

    Returns:
        The generated completion text with surrounding whitespace stripped.
    """
    # NOTE(review): the model is loaded from disk on every call, which is
    # expensive. Consider sharing one instance if the callers' threading and
    # memory constraints allow it.
    # NOTE(review): n_ctx=690 is small; a long prompt/response pair may not
    # fit in the context window -- confirm how callers bound their input.
    llm = Llama(
        model_path="./loyal-macaroni-maid-7b.Q6_K.gguf",
        n_ctx=690,
        n_threads=8,
        n_gpu_layers=32,
    )
    system_prompt = f"Based on the following interaction between a user and an AI assistant, generate a concise topic for the conversation in 2-6 words:\n\nUser: {prompt}\nAssistant: {response}\n\nTopic:"
    topic = llm(
        system_prompt,
        max_tokens=10,
        temperature=0.7,
        # Stop at a real newline so only the single topic line is returned.
        # The previous value "\\n" was a literal backslash followed by "n",
        # which does not match a line break.
        stop=["\n"],
        echo=False,
    )
    return topic['choices'][0]['text'].strip()