curl --request GET \
--url https://api.helicone.ai/v1/public/model-registry/models
{
"data": {
"models": [
{
"id": "<string>",
"name": "<string>",
"author": "<string>",
"contextLength": 123,
"endpoints": [
{
"provider": "<string>",
"providerSlug": "<string>",
"pricing": {
"prompt": 123,
"completion": 123,
"audio": 123,
"thinking": 123,
"web_search": 123,
"image": 123,
"video": 123,
"cacheRead": 123,
"cacheWrite": 123,
"threshold": 123
},
"endpoint": {
"pricing": [
{
"threshold": 123,
"input": 123,
"output": 123,
"image": 123,
"cacheMultipliers": {
"cachedInput": 123,
"write1h": 123,
"write5m": 123
},
"cacheStoragePerHour": 123,
"thinking": 123,
"request": 123,
"audio": 123,
"video": 123,
"web_search": 123
}
],
"contextLength": 123,
"maxCompletionTokens": 123,
"ptbEnabled": true,
"modelConfig": {
"pricing": [
{
"threshold": 123,
"input": 123,
"output": 123,
"image": 123,
"cacheMultipliers": {
"cachedInput": 123,
"write1h": 123,
"write5m": 123
},
"cacheStoragePerHour": 123,
"thinking": 123,
"request": 123,
"audio": 123,
"video": 123,
"web_search": 123
}
],
"contextLength": 123,
"maxCompletionTokens": 123,
"ptbEnabled": true,
"providerModelId": "<string>",
"provider": "baseten",
"author": "anthropic",
"supportedParameters": [
"max_tokens"
],
"endpointConfigs": {},
"version": "<string>",
"unsupportedParameters": [
"max_tokens"
],
"supportedPlugins": [
"web"
],
"rateLimits": {
"rpm": 123,
"tpm": 123,
"tpd": 123
},
"crossRegion": true,
"priority": 123,
"quantization": "fp4",
"responseFormat": "ANTHROPIC",
"requireExplicitRouting": true,
"providerModelIdAliases": [
"<string>"
]
},
"userConfig": {
"region": "<string>",
"location": "<string>",
"projectId": "<string>",
"baseUri": "<string>",
"deploymentName": "<string>",
"resourceName": "<string>",
"apiVersion": "<string>",
"crossRegion": true,
"gatewayMapping": "OPENAI",
"modelName": "<string>",
"heliconeModelId": "<string>"
},
"provider": "baseten",
"author": "anthropic",
"providerModelId": "<string>",
"supportedParameters": [
"max_tokens"
],
"version": "<string>",
"unsupportedParameters": [
"max_tokens"
],
"priority": 123
},
"supportsPtb": true,
"pricingTiers": [
{
"prompt": 123,
"completion": 123,
"audio": 123,
"thinking": 123,
"web_search": 123,
"image": 123,
"video": 123,
"cacheRead": 123,
"cacheWrite": 123,
"threshold": 123
}
]
}
],
"inputModalities": [
"text"
],
"outputModalities": [
"text"
],
"supportedParameters": [
"max_tokens"
],
"maxOutput": 123,
"trainingDate": "<string>",
"description": "<string>",
"pinnedVersionOfModel": "<string>"
}
],
"total": 123,
"filters": {
"capabilities": [
"audio"
],
"authors": [
"<string>"
],
"providers": [
{
"displayName": "<string>",
"name": "<string>"
}
]
}
},
"error": null
}
Returns all models and endpoints supported by the Helicone AI Gateway.
curl --request GET \
--url https://api.helicone.ai/v1/public/model-registry/models
{
"data": {
"models": [
{
"id": "<string>",
"name": "<string>",
"author": "<string>",
"contextLength": 123,
"endpoints": [
{
"provider": "<string>",
"providerSlug": "<string>",
"pricing": {
"prompt": 123,
"completion": 123,
"audio": 123,
"thinking": 123,
"web_search": 123,
"image": 123,
"video": 123,
"cacheRead": 123,
"cacheWrite": 123,
"threshold": 123
},
"endpoint": {
"pricing": [
{
"threshold": 123,
"input": 123,
"output": 123,
"image": 123,
"cacheMultipliers": {
"cachedInput": 123,
"write1h": 123,
"write5m": 123
},
"cacheStoragePerHour": 123,
"thinking": 123,
"request": 123,
"audio": 123,
"video": 123,
"web_search": 123
}
],
"contextLength": 123,
"maxCompletionTokens": 123,
"ptbEnabled": true,
"modelConfig": {
"pricing": [
{
"threshold": 123,
"input": 123,
"output": 123,
"image": 123,
"cacheMultipliers": {
"cachedInput": 123,
"write1h": 123,
"write5m": 123
},
"cacheStoragePerHour": 123,
"thinking": 123,
"request": 123,
"audio": 123,
"video": 123,
"web_search": 123
}
],
"contextLength": 123,
"maxCompletionTokens": 123,
"ptbEnabled": true,
"providerModelId": "<string>",
"provider": "baseten",
"author": "anthropic",
"supportedParameters": [
"max_tokens"
],
"endpointConfigs": {},
"version": "<string>",
"unsupportedParameters": [
"max_tokens"
],
"supportedPlugins": [
"web"
],
"rateLimits": {
"rpm": 123,
"tpm": 123,
"tpd": 123
},
"crossRegion": true,
"priority": 123,
"quantization": "fp4",
"responseFormat": "ANTHROPIC",
"requireExplicitRouting": true,
"providerModelIdAliases": [
"<string>"
]
},
"userConfig": {
"region": "<string>",
"location": "<string>",
"projectId": "<string>",
"baseUri": "<string>",
"deploymentName": "<string>",
"resourceName": "<string>",
"apiVersion": "<string>",
"crossRegion": true,
"gatewayMapping": "OPENAI",
"modelName": "<string>",
"heliconeModelId": "<string>"
},
"provider": "baseten",
"author": "anthropic",
"providerModelId": "<string>",
"supportedParameters": [
"max_tokens"
],
"version": "<string>",
"unsupportedParameters": [
"max_tokens"
],
"priority": 123
},
"supportsPtb": true,
"pricingTiers": [
{
"prompt": 123,
"completion": 123,
"audio": 123,
"thinking": 123,
"web_search": 123,
"image": 123,
"video": 123,
"cacheRead": 123,
"cacheWrite": 123,
"threshold": 123
}
]
}
],
"inputModalities": [
"text"
],
"outputModalities": [
"text"
],
"supportedParameters": [
"max_tokens"
],
"maxOutput": 123,
"trainingDate": "<string>",
"description": "<string>",
"pinnedVersionOfModel": "<string>"
}
],
"total": 123,
"filters": {
"capabilities": [
"audio"
],
"authors": [
"<string>"
],
"providers": [
{
"displayName": "<string>",
"name": "<string>"
}
]
}
},
"error": null
}
When a request names a model (e.g. gpt-4o-mini), the gateway consults this registry to find all providers offering that model, then applies routing logic to select the best provider based on your configuration, availability, and pricing.
Complete model registry with models and filter options
Show child attributes
Show child attributes
Show child attributes
Show child attributes
Show child attributes
Show child attributes
Show child attributes
Show child attributes
Show child attributes
baseten, anthropic, azure, bedrock, canopywave, cerebras, chutes, deepinfra, deepseek, fireworks, google-ai-studio, groq, helicone, mistral, nebius, novita, openai, openrouter, perplexity, vertex, xai
anthropic, deepseek, mistral, openai, perplexity, xai, google, meta-llama, amazon, microsoft, nvidia, qwen, moonshotai, alibaba, zai, baidu, passthrough
max_tokens, max_completion_tokens, temperature, top_p, top_k, stop, stream, frequency_penalty, presence_penalty, repetition_penalty, seed, tools, tool_choice, functions, function_call, reasoning, include_reasoning, thinking, response_format, json_mode, truncate, min_p, logit_bias, logprobs, top_logprobs, structured_outputs, verbosity, n
Construct a type with a set of properties K of type T
Show child attributes
Show child attributes
OPENAI, NO_MAPPING, RESPONSES
Show child attributes
Show child attributes
Show child attributes
max_tokens, max_completion_tokens, temperature, top_p, top_k, stop, stream, frequency_penalty, presence_penalty, repetition_penalty, seed, tools, tool_choice, functions, function_call, reasoning, include_reasoning, thinking, response_format, json_mode, truncate, min_p, logit_bias, logprobs, top_logprobs, structured_outputs, verbosity, n
web
fp4, fp8, fp16, bf16, int4
ANTHROPIC, OPENAI, GOOGLE
Show child attributes
OPENAI, NO_MAPPING, RESPONSES
baseten, anthropic, azure, bedrock, canopywave, cerebras, chutes, deepinfra, deepseek, fireworks, google-ai-studio, groq, helicone, mistral, nebius, novita, openai, openrouter, perplexity, vertex, xai
anthropic, deepseek, mistral, openai, perplexity, xai, google, meta-llama, amazon, microsoft, nvidia, qwen, moonshotai, alibaba, zai, baidu, passthrough
max_tokens, max_completion_tokens, temperature, top_p, top_k, stop, stream, frequency_penalty, presence_penalty, repetition_penalty, seed, tools, tool_choice, functions, function_call, reasoning, include_reasoning, thinking, response_format, json_mode, truncate, min_p, logit_bias, logprobs, top_logprobs, structured_outputs, verbosity, n
max_tokens, max_completion_tokens, temperature, top_p, top_k, stop, stream, frequency_penalty, presence_penalty, repetition_penalty, seed, tools, tool_choice, functions, function_call, reasoning, include_reasoning, thinking, response_format, json_mode, truncate, min_p, logit_bias, logprobs, top_logprobs, structured_outputs, verbosity, n
Show child attributes
text, image, audio, video
text, image, audio, video
max_tokens, max_completion_tokens, temperature, top_p, top_k, stop, stream, frequency_penalty, presence_penalty, repetition_penalty, seed, tools, tool_choice, functions, function_call, reasoning, include_reasoning, thinking, response_format, json_mode, truncate, min_p, logit_bias, logprobs, top_logprobs, structured_outputs, verbosity, n
Show child attributes
audio, video, image, thinking, web_search, caching, reasoning
Was this page helpful?