Chat & Text
Multi-Turn Conversations
Build a back-and-forth conversation by appending each assistant reply to your messages array before sending the next user message.
Python
python
import requests
BASE_URL = "https://api.oneinfer.ai"
token = requests.post(
f"{BASE_URL}/v1/ula/oauth-authentication?api_key=YOUR_API_KEY"
).json()["access_token"]
headers = {"Authorization": f"Bearer {token}", "Content-Type": "application/json"}
messages = [{"role": "system", "content": "You are a concise technical assistant."}]
def chat(user_message: str) -> str:
messages.append({"role": "user", "content": user_message})
response = requests.post(
f"{BASE_URL}/v1/ula/chat/completions",
headers=headers,
json={"provider": "openai", "model": "gpt-4o-mini", "messages": messages, "max_tokens": 256},
)
reply = response.json()["data"]["text"]
messages.append({"role": "assistant", "content": reply})
return reply
print(chat("What is a transformer?"))
print(chat("How does attention work in it?"))
print(chat("Give me a Python code snippet."))