def calculate_token_usage(text: str, model: str = "gpt-3.5-turbo") -> int:
    """Return the number of tokens `text` encodes to for `model`.

    Args:
        text: The string to tokenize.
        model: Model name used to look up the matching tiktoken encoding.

    Returns:
        The length of the token sequence produced by encoding `text`.
    """
    try:
        encoding = tiktoken.encoding_for_model(model)
    except KeyError:
        # tiktoken raises KeyError for model names it cannot map to an
        # encoding (e.g. new or fine-tuned models). Fall back to the
        # encoding used by the gpt-3.5 / gpt-4 chat models instead of
        # crashing the caller.
        encoding = tiktoken.get_encoding("cl100k_base")
    return len(encoding.encode(text))
# Token budget reserved for the model's reply; sent to the API as `max_tokens`.
MAX_COMPLETION_TOKENS = 700
# Context window of the base "gpt-3.5-turbo" model. The prompt and the
# completion share this window.
BASE_MODEL_CONTEXT_TOKENS = 4096

# Estimate the prompt size from the stringified message list.
# NOTE(review): this is only an estimate — the text counted here is the
# Python repr of `crafted_prompt`, not the exact form the API tokenizes.
token_usage = calculate_token_usage(str(crafted_prompt))

# The prompt AND the reserved completion budget must fit in the context
# window together, so the completion budget is added before comparing.
# Checking the prompt alone would route prompts that leave no room for the
# reply to the small model.
if token_usage + MAX_COMPLETION_TOKENS <= BASE_MODEL_CONTEXT_TOKENS:
    model = "gpt-3.5-turbo"
else:
    model = "gpt-3.5-turbo-16k"

# `max_tokens` caps only the generated completion; total usage reported by
# the API is prompt tokens plus completion tokens.
response = openai.ChatCompletion.create(
    model=model,
    messages=crafted_prompt,
    temperature=0.95,
    max_tokens=MAX_COMPLETION_TOKENS,
    top_p=1,
    frequency_penalty=0,
    presence_penalty=0.28,
)
# This will generate responses whose combined usage (prompt + completion tokens) is bigger than 700.