Spaces:
Sleeping
Sleeping
File size: 414 Bytes
9657faa |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 |
import os

from huggingface_hub import InferenceClient
# Stream a single chat completion from the Hugging Face Inference API and
# echo the generated text to stdout as it arrives.

# The access token is read from the environment so it never appears in
# source. os.getenv returns None when HF_TOKEN is unset.
# NOTE(review): with api_key=None the request is presumably sent
# unauthenticated (or with a locally cached token) -- confirm this is the
# intended fallback for this deployment.
api_key = os.getenv("HF_TOKEN")
client = InferenceClient(api_key=api_key)

# Single-turn conversation in the chat-completions message format.
messages = [
    {"role": "user", "content": "Tell me a story"},
]

# stream=True makes the call yield incremental chunks instead of returning
# one complete response.
stream = client.chat.completions.create(
    model="HuggingFaceH4/zephyr-7b-beta",
    messages=messages,
    temperature=0.5,
    max_tokens=2048,
    top_p=0.7,
    stream=True,
)

for chunk in stream:
    # Guard against chunks that carry no choices so indexing cannot fail.
    if not chunk.choices:
        continue
    text = chunk.choices[0].delta.content
    # delta.content is optional; skip empty/None fragments rather than
    # printing the literal string "None".
    if text:
        # end="" keeps the fragments contiguous; flush=True shows them
        # immediately instead of waiting for the stdout buffer to fill.
        print(text, end="", flush=True)

# Terminate the streamed output with a single newline.
print()