Create a message

# Create a message: POST one user turn to the Messages endpoint.
# <token> is a placeholder for the API key sent as a bearer token.
curl -X POST 'https://openrouter.ai/api/v1/messages' \
  -H 'Authorization: Bearer <token>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "max_tokens": 1024,
  "messages": [
    {
      "content": "Hello, how are you?",
      "role": "user"
    }
  ],
  "model": "anthropic/claude-sonnet-4"
}
'

import requests

# Endpoint that creates a message.
url = "https://openrouter.ai/api/v1/messages"

# Request body: a single user turn, capped at 1024 output tokens.
payload = {
    "max_tokens": 1024,
    "messages": [
        {
            "content": "Hello, how are you?",
            "role": "user"
        }
    ],
    "model": "anthropic/claude-sonnet-4"
}
# <token> is a placeholder for the API key sent as a bearer token.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests waits indefinitely unless a timeout is given; bound the wait so a
# stalled connection cannot hang the script (30 s, as in the PHP example).
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (success or error payload alike).
print(response.text)

// Request configuration: bearer-token auth plus a JSON body containing a
// single user turn. <token> is a placeholder for the API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify({
    max_tokens: 1024,
    messages: [
      {
        content: 'Hello, how are you?',
        role: 'user'
      }
    ],
    model: 'anthropic/claude-sonnet-4'
  })
};

// Send the request, log the parsed JSON reply, and log any failure
// (network error or unparsable body) to stderr.
(async () => {
  try {
    const res = await fetch('https://openrouter.ai/api/v1/messages', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// JSON request body: a single user turn, capped at 1024 output tokens.
$payload = json_encode([
  'max_tokens' => 1024,
  'messages' => [
    ['content' => 'Hello, how are you?', 'role' => 'user']
  ],
  'model' => 'anthropic/claude-sonnet-4'
]);

$ch = curl_init();

// Configure a POST that returns the body as a string instead of printing it.
curl_setopt_array($ch, [
  CURLOPT_URL => "https://openrouter.ai/api/v1/messages",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($ch);
$err = curl_error($ch);

curl_close($ch);

// Report the transport error if there was one; otherwise print the body.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the example "create a message" request and prints the raw
// response body. Each failure is reported and the program returns early,
// so a failed request never leads to a nil-pointer dereference on res.
func main() {

	url := "https://openrouter.ai/api/v1/messages"

	// JSON request body: a single user turn, capped at 1024 output tokens.
	payload := strings.NewReader("{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request failed:", err)
		return
	}

	// <token> is a placeholder for the API key sent as a bearer token.
	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil here; touching res.Body would panic.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response failed:", err)
		return
	}

	fmt.Println(string(body))

}

// JSON request body: a single user turn, capped at 1024 output tokens.
String payload = "{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}";

// POST the payload with bearer-token auth and read the reply as a string.
HttpResponse<String> response = Unirest
  .post("https://openrouter.ai/api/v1/messages")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body(payload)
  .asString();

require 'uri'
require 'net/http'

# Endpoint that creates a message.
endpoint = URI("https://openrouter.ai/api/v1/messages")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST: bearer-token auth plus a JSON body with a single user turn.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = 'Bearer <token>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}"

# Send the request and print the raw response body.
puts client.request(post).read_body

{
  "container": null,
  "content": [
    {
      "citations": [],
      "text": "I'm doing well, thank you for asking! How can I help you today?",
      "type": "text"
    }
  ],
  "id": "msg_abc123",
  "model": "anthropic/claude-sonnet-4",
  "role": "assistant",
  "stop_details": null,
  "stop_reason": "end_turn",
  "stop_sequence": null,
  "type": "message",
  "usage": {
    "cache_creation": null,
    "cache_creation_input_tokens": null,
    "cache_read_input_tokens": null,
    "inference_geo": null,
    "input_tokens": 12,
    "output_tokens": 18,
    "output_tokens_details": null,
    "server_tool_use": null,
    "service_tier": "standard"
  }
}

POST

messages

Create a message

# Create a message: POST one user turn to the Messages endpoint.
# <token> is a placeholder for the API key sent as a bearer token.
curl -X POST 'https://openrouter.ai/api/v1/messages' \
  -H 'Authorization: Bearer <token>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "max_tokens": 1024,
  "messages": [
    {
      "content": "Hello, how are you?",
      "role": "user"
    }
  ],
  "model": "anthropic/claude-sonnet-4"
}
'

import requests

# Endpoint that creates a message.
url = "https://openrouter.ai/api/v1/messages"

# Request body: a single user turn, capped at 1024 output tokens.
payload = {
    "max_tokens": 1024,
    "messages": [
        {
            "content": "Hello, how are you?",
            "role": "user"
        }
    ],
    "model": "anthropic/claude-sonnet-4"
}
# <token> is a placeholder for the API key sent as a bearer token.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests waits indefinitely unless a timeout is given; bound the wait so a
# stalled connection cannot hang the script (30 s, as in the PHP example).
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (success or error payload alike).
print(response.text)

// Request configuration: bearer-token auth plus a JSON body containing a
// single user turn. <token> is a placeholder for the API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify({
    max_tokens: 1024,
    messages: [
      {
        content: 'Hello, how are you?',
        role: 'user'
      }
    ],
    model: 'anthropic/claude-sonnet-4'
  })
};

// Send the request, log the parsed JSON reply, and log any failure
// (network error or unparsable body) to stderr.
(async () => {
  try {
    const res = await fetch('https://openrouter.ai/api/v1/messages', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// JSON request body: a single user turn, capped at 1024 output tokens.
$payload = json_encode([
  'max_tokens' => 1024,
  'messages' => [
    ['content' => 'Hello, how are you?', 'role' => 'user']
  ],
  'model' => 'anthropic/claude-sonnet-4'
]);

$ch = curl_init();

// Configure a POST that returns the body as a string instead of printing it.
curl_setopt_array($ch, [
  CURLOPT_URL => "https://openrouter.ai/api/v1/messages",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $payload,
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($ch);
$err = curl_error($ch);

curl_close($ch);

// Report the transport error if there was one; otherwise print the body.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends the example "create a message" request and prints the raw
// response body. Each failure is reported and the program returns early,
// so a failed request never leads to a nil-pointer dereference on res.
func main() {

	url := "https://openrouter.ai/api/v1/messages"

	// JSON request body: a single user turn, capped at 1024 output tokens.
	payload := strings.NewReader("{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request failed:", err)
		return
	}

	// <token> is a placeholder for the API key sent as a bearer token.
	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil here; touching res.Body would panic.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response failed:", err)
		return
	}

	fmt.Println(string(body))

}

// JSON request body: a single user turn, capped at 1024 output tokens.
String payload = "{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}";

// POST the payload with bearer-token auth and read the reply as a string.
HttpResponse<String> response = Unirest
  .post("https://openrouter.ai/api/v1/messages")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body(payload)
  .asString();

require 'uri'
require 'net/http'

# Endpoint that creates a message.
endpoint = URI("https://openrouter.ai/api/v1/messages")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST: bearer-token auth plus a JSON body with a single user turn.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = 'Bearer <token>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"max_tokens\": 1024,\n  \"messages\": [\n    {\n      \"content\": \"Hello, how are you?\",\n      \"role\": \"user\"\n    }\n  ],\n  \"model\": \"anthropic/claude-sonnet-4\"\n}"

# Send the request and print the raw response body.
puts client.request(post).read_body

{
  "container": null,
  "content": [
    {
      "citations": [],
      "text": "I'm doing well, thank you for asking! How can I help you today?",
      "type": "text"
    }
  ],
  "id": "msg_abc123",
  "model": "anthropic/claude-sonnet-4",
  "role": "assistant",
  "stop_details": null,
  "stop_reason": "end_turn",
  "stop_sequence": null,
  "type": "message",
  "usage": {
    "cache_creation": null,
    "cache_creation_input_tokens": null,
    "cache_read_input_tokens": null,
    "inference_geo": null,
    "input_tokens": 12,
    "output_tokens": 18,
    "output_tokens_details": null,
    "server_tool_use": null,
    "service_tier": "standard"
  }
}

Authorizations

Authorization

string

header

required

API key as bearer token in Authorization header

Headers

X-OpenRouter-Metadata

enum<string>

Opt-in level for surfacing routing metadata on the response under openrouter_metadata. Defaults to disabled. The legacy header X-OpenRouter-Experimental-Metadata is also accepted for backward compatibility.

Available options:

disabled,

enabled

Example:

"enabled"

Body

application/json

Request schema for Anthropic Messages API endpoint

messages

object[] | null

required

Show child attributes

model

string

required

cache_control

object

Enable automatic prompt caching. When set at the top level, the system automatically applies cache breakpoints to the last cacheable block in the request. When set on an individual content block, it marks an explicit cache breakpoint; block-level markers also work on OpenAI models that support explicit prompt caching — OpenRouter converts them to the provider's native format.

Show child attributes

Example:

{ "type": "ephemeral" }

context_management

object | null

Show child attributes

fallbacks

object[] | null

Fallback models to try if the primary model fails or refuses, in order. Handled by OpenRouter multi-model routing rather than Anthropic server-side fallbacks; cannot be combined with models. Each entry accepts only model. Maximum of 3 entries.

Show child attributes

Example:

[{ "model": "claude-opus-4-8" }]

max_tokens

integer

metadata

object

Show child attributes

models

string[]

output_config

object

Configuration for controlling output behavior. Supports the effort parameter and structured output format.

Show child attributes

Example:

{ "effort": "medium" }

plugins

object[]

Plugins you want to enable for this request, including their settings.

Show child attributes

Example:

{
  "allowed_models": ["anthropic/*", "openai/gpt-4o"],
  "cost_quality_tradeoff": 7,
  "enabled": true,
  "id": "auto-router",
  "pin_model": false
}

provider

object | null

When multiple model providers are available, optionally indicate your routing preference.

Show child attributes

Example:

{ "allow_fallbacks": true }

route

enum<string> | null

deprecated

DEPRECATED: Use provider.sort.partition instead. Backwards-compatible alias for provider.sort.partition. Accepts legacy values: "fallback" (maps to "model"), "sort" (maps to "none").

Available options:

fallback,

sort,

null

Example:

"fallback"

service_tier

string

session_id

string

A unique identifier for grouping related requests (e.g., a conversation or agent workflow). When provided, OpenRouter uses it as the sticky routing key, routing all requests in the session to the same provider to maximize prompt cache hits. Also used for observability grouping. If provided in both the request body and the x-session-id header, the body value takes precedence. Maximum of 256 characters.

Maximum string length: 256

speed

enum<string> | null

Controls output generation speed. When set to fast, uses a higher-speed inference configuration at premium pricing. Defaults to standard when omitted.

Available options:

fast,

standard,

null

Example:

"fast"

stop_sequences

string[]

stop_server_tools_when

object[]

Stop conditions for the server-tool agent loop. Any condition firing halts the loop (OR logic). When set, this overrides max_tool_calls. When a condition fires while the model is still emitting tool calls, the pending tool calls are executed and one final turn is made with tool calls disabled so the response ends with a natural-language answer instead of an unfinished tool call.

Minimum array length: 1

A single condition that, when met, halts the server-tool agent loop.

Option 1
Option 2
Option 3
Option 4
Option 5

Show child attributes

Example:

{ "step_count": 5, "type": "step_count_is" }

Example:

[
  { "step_count": 5, "type": "step_count_is" },
  {
    "max_cost_in_dollars": 0.5,
    "type": "max_cost"
  }
]

stream

boolean

system

temperature

number<double>

thinking

object

Option 1
Option 2
Option 3

Show child attributes

tool_choice

object

Option 1
Option 2
Option 3
Option 4

Show child attributes

tools

object[]

Show child attributes

top_k

integer

top_p

number<double>

trace

object

Metadata for observability and tracing. Known keys (trace_id, trace_name, span_name, generation_name, parent_span_id) have special handling. Additional keys are passed through as custom metadata to configured broadcast destinations.

Show child attributes

Example:

{
  "trace_id": "trace-abc123",
  "trace_name": "my-app-trace"
}

user

string

A unique identifier representing your end-user, which helps distinguish between different users of your app. This allows your app to identify specific users in case of abuse reports, preventing your entire app from being affected by the actions of individual users. Maximum of 256 characters.

Maximum string length: 256

Response

Successful response

Non-streaming response from the Anthropic Messages API with OpenRouter extensions

container

object | null

required

Show child attributes

Example:

{
  "expires_at": "2026-04-08T00:00:00Z",
  "id": "ctr_01abc"
}

content

object[]

required

Show child attributes

Example:

{
  "citations": null,
  "text": "Hello, world!",
  "type": "text"
}

id

string

required

model

string

required

role

enum<string>

required

Available options:

assistant

stop_details

object | null

required

Structured information about a refusal

Show child attributes

Example:

{
  "category": "cyber",
  "explanation": "The request was refused due to policy.",
  "type": "refusal"
}

stop_reason

enum<string> | null

required

Available options:

end_turn,

max_tokens,

stop_sequence,

tool_use,

pause_turn,

refusal,

compaction,

null

Example:

"end_turn"

stop_sequence

string | null

required

type

enum<string>

required

Available options:

message

usage

object

required

Show child attributes

Example:

{
  "cache_creation": null,
  "cache_creation_input_tokens": null,
  "cache_read_input_tokens": null,
  "inference_geo": null,
  "input_tokens": 100,
  "output_tokens": 50,
  "output_tokens_details": null,
  "server_tool_use": null,
  "service_tier": "standard"
}

context_management

object | null

Show child attributes

openrouter_metadata

object

Show child attributes

Example:

{
  "attempt": 1,
  "endpoints": {
    "available": [
      {
        "model": "openai/gpt-4o",
        "provider": "OpenAI",
        "selected": true
      }
    ],
    "total": 1
  },
  "is_byok": false,
  "region": "iad",
  "requested": "openai/gpt-4o",
  "strategy": "direct",
  "summary": "available=1, selected=OpenAI"
}

provider

enum<string>

Available options:

AkashML,

AI21,

AionLabs,

Alibaba,

Ambient,

Baidu,

Amazon Bedrock,

Amazon Nova,

Anthropic,

Arcee AI,

AtlasCloud,

Avian,

Azure,

BaseTen,

BytePlus,

Black Forest Labs,

Cerebras,

Chutes,

Cirrascale,

Clarifai,

Cloudflare,

Cohere,

CoreWeave,

Crucible,

Crusoe,

Darkbloom,

Decart,

Deepgram,

DeepInfra,

DeepSeek,

DekaLLM,

DigitalOcean,

Featherless,

Fireworks,

Fish Audio,

Friendli,

GMICloud,

Google,

Google AI Studio,

Groq,

HeyGen,

Inception,

Inceptron,

InferenceNet,

Ionstream,

Infermatic,

Io Net,

Inferact vLLM,

Inflection,

Liquid,

Mara,

Mancer 2,

Meta,

Minimax,

ModelRun,

Mistral,

Modular,

Moonshot AI,

Morph,

NCompass,

Nebius,

Nex AGI,

NextBit,

Novita,

Nvidia,

OpenAI,

OpenInference,

Parasail,

Poolside,

Perceptron,

Perplexity,

Phala,

Recraft,

Reka,

Relace,

Sail Research,

Sakana AI,

SambaNova,

Seed,

SiliconFlow,

Sourceful,

StepFun,

Stealth,

StreamLake,

Switchpoint,

Tencent,

Tenstorrent,

Together,

Upstage,

Venice,

Wafer,

WandB,

Quiver,

Krea,

Runway,

Xiaomi,

xAI,

Z.AI,

FakeProvider

Example:

"OpenAI"

Update an API key | Get a model by its slug

⌘I

API Guides

API Reference

Create a message

Authorizations

Headers

Body

Response