import os
from openai import OpenAI
# Stream a chat completion from a Baseten deployment through the OpenAI client
# and echo the generated text to stdout as it arrives.

# Base URL of the deployment's OpenAI-compatible endpoint. Replace the empty
# string with your own endpoint before running, for example:
# https://model-XXXXXXX.api.baseten.co/environments/production/sync/v1
model_url = ""

client = OpenAI(
    base_url=model_url,
    # os.environ.get returns None when BASETEN_API_KEY is not set.
    api_key=os.environ.get("BASETEN_API_KEY"),
)

# stream=True makes create() return an iterable of incremental chunks instead
# of a single completed response.
stream = client.chat.completions.create(
    model="baseten",
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "What was the role of Llamas in the Inca empire?"},
    ],
    stream=True,
)

for chunk in stream:
    # A chunk can arrive with an empty `choices` list (e.g. a usage-only
    # chunk); indexing [0] on it would raise IndexError, so skip it.
    if not chunk.choices:
        continue
    text = chunk.choices[0].delta.content
    if text is not None:
        # Flush on every fragment so output appears while the model is still
        # generating rather than when the stdout buffer happens to drain.
        print(text, end="", flush=True)