Spaces:
Runtime error
Runtime error
import time | |
import openai | |
import os | |
from utils import dotdict | |
OPENAI_API_KEY = os.environ.get('OPENAI_API_KEY') #"Enter your openai API key" | |
completion_tokens = 0 | |
prompt_tokens = 0 | |
def gpt(prompt, model, temperature=0.7, max_tokens=4000, n=1, stop=None) -> list: | |
messages = [{"role": "user", "content": prompt}] | |
if model == "gpt-4": | |
pass | |
time.sleep(30) # to prevent speed limitation exception | |
return chatgpt(messages, model=model, temperature=temperature, max_tokens=max_tokens, n=n, stop=stop) | |
def chatgpt(messages, model, temperature, max_tokens, n, stop) -> list: | |
global completion_tokens, prompt_tokens | |
outputs = [] | |
while n > 0: | |
cnt = min(n, 20) | |
n -= cnt | |
res = openai.chat.completions.create(model=model, messages=messages, temperature=temperature, max_tokens=max_tokens, | |
n=cnt, stop=stop) | |
outputs.extend([choice.message.content for choice in res.choices]) | |
# log completion tokens | |
completion_tokens += res.usage.completion_tokens | |
prompt_tokens += res.usage.prompt_tokens | |
return outputs | |
def gpt_usage(backend="gpt-4"): | |
global completion_tokens, prompt_tokens | |
if backend == "gpt-4": | |
cost = completion_tokens / 1000 * 0.06 + prompt_tokens / 1000 * 0.03 | |
elif backend == "gpt-4-turbo-preview": | |
cost = completion_tokens / 1000 * 0.03 + prompt_tokens / 1000 * 0.01 | |
elif backend == "gpt-3.5-turbo": | |
cost = completion_tokens / 1000 * 0.002 + prompt_tokens / 1000 * 0.0015 | |
return {"completion_tokens": completion_tokens, "prompt_tokens": prompt_tokens, "cost": cost} | |