Deploy DeepSeek-R1
Example usage
DeepSeek-R1 is optimized using SGLang and exposes an OpenAI-compatible API endpoint.
Input
Copy
Ask AI
import httpx
import os
# Example: send one chat-completion request to a deployed model and print
# the decoded JSON response.

# Placeholders -- substitute the identifiers of your own deployment.
MODEL_ID = "abcd1234"  # Replace with your model ID
# DEPLOYMENT_ID is optional and is not referenced by the request below,
# which addresses the model's "production" environment via MODEL_ID only.
DEPLOYMENT_ID = "abcd1234"  # [Optional] Replace with your deployment ID

# The API key is read from the environment; a missing BASETEN_API_KEY
# raises KeyError here, before any request is made.
API_KEY = os.environ["BASETEN_API_KEY"]

# Request target and authentication header.
url = f"https://model-{MODEL_ID}.api.baseten.co/environments/production/sync/v1/chat/completions"
headers = {"Authorization": f"Api-Key {API_KEY}"}

# Conversation: a system prompt followed by a single user question.
messages = [
    {"role": "system", "content": "You are a helpful AI assistant."},
    {"role": "user", "content": "What weighs more, a pound of bricks or a pound of feathers?"},
]

# NOTE(review): the payload names "deepseek_v3" although this example is
# for DeepSeek-R1 -- confirm which model identifier the deployment expects.
payload = {
    "model": "deepseek_v3",
    "messages": messages,
    "max_tokens": 1024,
}

# timeout=None turns off httpx's default timeouts, so the call waits for
# as long as the server takes to respond.
resp = httpx.post(url, headers=headers, json=payload, timeout=None)

# Decode the response body as JSON and print it.
print(resp.json())
Output
Copy
Ask AI
{
"id": "8456fe51db3548789f199cfb8c8efd35",
"object": "text_completion",
"created": 1735236968,
"model": "/models/deepseek_r1",
"choices": [
{
"index": 0,
"text": "Let's think through this step by step...",
"logprobs": null,
"finish_reason": "stop",
"matched_stop": 1
}
],
"usage": {
"prompt_tokens": 14,
"total_tokens": 240,
"completion_tokens": 226,
"prompt_tokens_details": null
}
}