{"kind":"llmreference.router.index","schemaVersion":1,"resource":"routers","source":"data/seed/router.json","routes":{"apiIndex":"/api/routers","apiDetail":"/api/router/{slug}","humanDirectory":"/routers","humanDetail":"/router/{slug}"},"count":18,"activeCount":17,"bestPages":[{"slug":"llm-gateways","href":"/best/llm-gateways","title":"Best LLM gateways","filter":{"types":["gateway"]},"count":4},{"slug":"llm-routers","href":"/best/llm-routers","title":"Best LLM routers","filter":{"types":["router"]},"count":10},{"slug":"openrouter-alternatives","href":"/best/openrouter-alternatives","title":"OpenRouter alternatives","filter":{"types":["gateway","hybrid"],"excludedSlugs":["openrouter"]},"count":6},{"slug":"self-hosted-router","href":"/best/self-hosted-router","title":"Self-hosted LLM routers","filter":{"hosting":"self_hosted"},"count":4},{"slug":"open-source-llm-router","href":"/best/open-source-llm-router","title":"Open-source LLM routers","filter":{"openness":"open_source"},"count":5},{"slug":"cheapest-llm-gateway","href":"/best/cheapest-llm-gateway","title":"Cheapest LLM gateway options","filter":{"objective":"cost"},"count":17},{"slug":"llm-cost-optimization","href":"/best/llm-cost-optimization","title":"LLM cost optimization routers","filter":{"objective":"cost"},"count":17}],"routers":[{"slug":"litellm","name":"LiteLLM","vendor":"BerriAI","type":"gateway","status":"active","summary":"Open-source Python SDK and proxy server that unifies 100+ LLM APIs behind a single OpenAI-compatible interface, with load balancing, cost tracking, and configurable failover.","editorTake":null,"bestFor":["open source","self-hosting","OpenAI-compatible proxy","developer tooling","cost tracking"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","microsoft-foundry","azure-openai","cohere-api","mistral-ai-api","deepseek-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/microsoft-foundry","/provider/azure-openai","/provider/cohere-api","/provider/mistral-ai-api","/provider/deepseek-api"],"modelsCount":100,"apiCompatibility":["openai"],"pricingModel":"free_oss","dataRetention":"zero_retention","selfHostAvailable":true,"href":"/router/litellm","apiHref":"/api/router/litellm","lastChecked":"2026-06-08"},{"slug":"openrouter","name":"OpenRouter","vendor":"OpenRouter, Inc.","type":"hybrid","status":"active","summary":"Unified hybrid gateway to 400+ models from 60+ providers via a single OpenAI-compatible API, with optional auto-routing that selects the best model per prompt.","editorTake":null,"bestFor":["multi-provider access","cost optimization","auto model selection","provider fallback"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api","xai-console","deepseek-api","cohere-api","together-ai","fireworks-ai"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api","/provider/xai-console","/provider/deepseek-api","/provider/cohere-api","/provider/together-ai","/provider/fireworks-ai"],"modelsCount":400,"apiCompatibility":["openai"],"pricingModel":"passthrough","dataRetention":"opt_in_logging","selfHostAvailable":false,"href":"/router/openrouter","apiHref":"/api/router/openrouter","lastChecked":"2026-06-08"},{"slug":"portkey","name":"Portkey","vendor":"Portkey AI","type":"gateway","status":"active","summary":"Production AI gateway routing to 1,600+ LLMs with failover, load balancing, semantic caching, and guardrails; Apache 2.0 core is fully self-hostable with the complete feature set.","editorTake":null,"bestFor":["production reliability","governance","observability","self-hosting","enterprise"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","microsoft-foundry","azure-openai","cohere-api","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/microsoft-foundry","/provider/azure-openai","/provider/cohere-api","/provider/mistral-ai-api"],"modelsCount":1600,"apiCompatibility":["openai"],"pricingModel":"subscription","dataRetention":"opt_in_logging","selfHostAvailable":true,"href":"/router/portkey","apiHref":"/api/router/portkey","lastChecked":"2026-06-08"},{"slug":"airouter","name":"AIRouter","vendor":"Heureka Labs UG","type":"router","status":"active","summary":"Commercial LLM router that analyzes incoming requests and routes to the optimal model for cost/quality/latency via a drop-in OpenAI-compatible API, with a privacy-preserving embedding mode that avoids sending prompt content.","editorTake":null,"bestFor":["cost optimization","OpenAI drop-in replacement","privacy-aware routing"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api"],"modelsCount":null,"apiCompatibility":["openai"],"pricingModel":"passthrough_plus_fee","dataRetention":"unknown","selfHostAvailable":false,"href":"/router/airouter","apiHref":"/api/router/airouter","lastChecked":"2026-06-08"},{"slug":"bedrock-intelligent-prompt-routing","name":"Amazon Bedrock Intelligent Prompt Routing","vendor":"Amazon Web Services","type":"router","status":"active","summary":"AWS Bedrock's native intelligent prompt router that routes prompts between Anthropic Claude model tiers (Haiku/Sonnet) based on predicted task complexity, with no extra per-routing charge.","editorTake":null,"bestFor":["Bedrock users","Claude cost optimization","AWS ecosystem"],"targetProviders":["aws-bedrock"],"targetProviderHrefs":["/provider/aws-bedrock"],"modelsCount":null,"apiCompatibility":["native"],"pricingModel":"passthrough","dataRetention":"retains","selfHostAvailable":false,"href":"/router/bedrock-intelligent-prompt-routing","apiHref":"/api/router/bedrock-intelligent-prompt-routing","lastChecked":"2026-06-08"},{"slug":"azure-foundry-model-router","name":"Azure AI Foundry Model Router","vendor":"Microsoft","type":"router","status":"active","summary":"Microsoft Azure AI Foundry's native model router that uses a trained ML model to route each prompt in real time to the optimal Azure-hosted model, with Balanced/Cost/Quality mode selection and automatic failover.","editorTake":null,"bestFor":["Azure AI Foundry users","cost optimization","Microsoft ecosystem","zero-configuration routing"],"targetProviders":["microsoft-foundry","azure-openai"],"targetProviderHrefs":["/provider/microsoft-foundry","/provider/azure-openai"],"modelsCount":null,"apiCompatibility":["openai"],"pricingModel":"passthrough","dataRetention":"retains","selfHostAvailable":false,"href":"/router/azure-foundry-model-router","apiHref":"/api/router/azure-foundry-model-router","lastChecked":"2026-06-08"},{"slug":"helicone","name":"Helicone","vendor":"Helicone","type":"gateway","status":"active","summary":"Observability-first AI gateway with routing, caching, rate limiting, and request tracing; Apache 2.0 open-source core with a managed hosted tier for logging and analytics.","editorTake":null,"bestFor":["observability","LLM tracing","cost tracking","self-hosting"],"targetProviders":["openai-api","anthropic-api","microsoft-foundry","azure-openai","google-ai-studio","gcp-vertex-ai"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/microsoft-foundry","/provider/azure-openai","/provider/google-ai-studio","/provider/gcp-vertex-ai"],"modelsCount":null,"apiCompatibility":["openai","anthropic"],"pricingModel":"subscription","dataRetention":"opt_in_logging","selfHostAvailable":true,"href":"/router/helicone","apiHref":"/api/router/helicone","lastChecked":"2026-06-08"},{"slug":"kong-ai-gateway","name":"Kong AI Gateway","vendor":"Kong Inc.","type":"gateway","status":"active","summary":"Multi-LLM AI gateway built on Kong Gateway 3.x, adding semantic routing, load balancing, guardrails, and MCP traffic analytics as plugins over Kong's existing API management platform.","editorTake":null,"bestFor":["enterprise API management","multi-LLM routing","Kong users","self-hosting"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","microsoft-foundry","azure-openai","cohere-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/microsoft-foundry","/provider/azure-openai","/provider/cohere-api"],"modelsCount":null,"apiCompatibility":["openai","native"],"pricingModel":"subscription","dataRetention":"unknown","selfHostAvailable":true,"href":"/router/kong-ai-gateway","apiHref":"/api/router/kong-ai-gateway","lastChecked":"2026-06-08"},{"slug":"martian","name":"Martian","vendor":"Martian, Inc.","type":"router","status":"active","summary":"AI-powered LLM router that analyzes each prompt in real-time to select the optimal model, targeting 20–97% cost reduction while maintaining quality; San Francisco startup reportedly nearing $1.3B valuation.","editorTake":null,"bestFor":["cost reduction","quality optimization","enterprise routing"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api"],"modelsCount":null,"apiCompatibility":["openai","native"],"pricingModel":"passthrough_plus_fee","dataRetention":"unknown","selfHostAvailable":false,"href":"/router/martian","apiHref":"/api/router/martian","lastChecked":"2026-06-08"},{"slug":"neutrino","name":"Neutrino AI","vendor":"Neutrino AI","type":"router","status":"active","summary":"Commercial LLM router that dynamically routes each query to the best-suited model with load balancing and fallback handling, charging 3% of underlying AI spend.","editorTake":null,"bestFor":["cost reduction","dynamic model selection","load balancing","fallback handling"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api"],"modelsCount":null,"apiCompatibility":["native"],"pricingModel":"passthrough_plus_fee","dataRetention":"opt_in_logging","selfHostAvailable":false,"href":"/router/neutrino","apiHref":"/api/router/neutrino","lastChecked":"2026-06-08"},{"slug":"not-diamond","name":"Not Diamond","vendor":"Not Diamond","type":"router","status":"active","summary":"Predictive model router that determines the best LLM for each query; claims up to 25% accuracy gains and 10x cost reduction; powers OpenRouter's auto mode and is positioned specifically for coding agents.","editorTake":null,"bestFor":["coding agents","accuracy optimization","cost reduction"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api"],"modelsCount":null,"apiCompatibility":["native"],"pricingModel":"enterprise_quote","dataRetention":"opt_in_logging","selfHostAvailable":false,"href":"/router/not-diamond","apiHref":"/api/router/not-diamond","lastChecked":"2026-06-08"},{"slug":"nvidia-llm-router","name":"NVIDIA LLM Router Blueprint","vendor":"NVIDIA","type":"router","status":"deprecated","summary":"NVIDIA's open-source AI blueprint for LLM routing that selects the optimal model per prompt via intent classification or neural auto-routing; being deprecated 2026-06-20.","editorTake":null,"bestFor":["open source","reference implementation","NVIDIA ecosystem","self-hosting"],"targetProviders":["openai-api","anthropic-api","nvidia-nim"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/nvidia-nim"],"modelsCount":null,"apiCompatibility":["openai","native"],"pricingModel":"free_oss","dataRetention":"zero_retention","selfHostAvailable":true,"href":"/router/nvidia-llm-router","apiHref":"/api/router/nvidia-llm-router","lastChecked":"2026-06-08"},{"slug":"openai-auto","name":"OpenAI Auto Routing (GPT-5 Auto)","vendor":"OpenAI","type":"router","status":"active","summary":"OpenAI's native auto-routing mode (GPT-5 Auto) that dynamically routes each API request between GPT-5 and GPT-5 Instant based on prompt complexity, with no extra charge beyond model token costs.","editorTake":null,"bestFor":["OpenAI users","zero-configuration routing","automatic cost optimization"],"targetProviders":["openai-api"],"targetProviderHrefs":["/provider/openai-api"],"modelsCount":null,"apiCompatibility":["openai","native"],"pricingModel":"passthrough","dataRetention":"retains","selfHostAvailable":false,"href":"/router/openai-auto","apiHref":"/api/router/openai-auto","lastChecked":"2026-06-08"},{"slug":"requesty","name":"Requesty","vendor":"Requesty","type":"hybrid","status":"active","summary":"AI gateway to 400+ LLM providers with intelligent routing, caching, guardrails, and governance; flat 5% markup on model costs with no subscription fee.","editorTake":null,"bestFor":["cost optimization","observability","governance","EU data residency"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api","deepseek-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api","/provider/deepseek-api"],"modelsCount":400,"apiCompatibility":["openai"],"pricingModel":"passthrough_plus_fee","dataRetention":"opt_in_logging","selfHostAvailable":false,"href":"/router/requesty","apiHref":"/api/router/requesty","lastChecked":"2026-06-08"},{"slug":"respan","name":"Respan","vendor":"Respan (formerly Keywords AI)","type":"hybrid","status":"active","summary":"Unified LLM engineering platform (gateway + observability + evals + prompt management) routing across 250+ models; previously Keywords AI, rebranded February 2026.","editorTake":null,"bestFor":["observability","evals","prompt management","multi-model gateway","agent tracing"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api","deepseek-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api","/provider/deepseek-api"],"modelsCount":250,"apiCompatibility":["openai"],"pricingModel":"subscription","dataRetention":"opt_in_logging","selfHostAvailable":false,"href":"/router/respan","apiHref":"/api/router/respan","lastChecked":"2026-06-08"},{"slug":"routellm","name":"RouteLLM","vendor":"LMSYS (lm-sys)","type":"router","status":"active","summary":"Open-source LLM routing framework from LMSYS that routes simpler queries to a cheaper weak model and harder ones to a stronger frontier model, achieving 35–85% cost reduction on benchmarks.","editorTake":null,"bestFor":["open source","binary cost optimization","research","self-hosting"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai"],"modelsCount":null,"apiCompatibility":["openai"],"pricingModel":"free_oss","dataRetention":"zero_retention","selfHostAvailable":true,"href":"/router/routellm","apiHref":"/api/router/routellm","lastChecked":"2026-06-08"},{"slug":"unify","name":"Unify","vendor":"Unify AI","type":"router","status":"active","summary":"Benchmark-driven LLM router using a neural scorer and live runtime benchmarks refreshed every 10 minutes to route each request to the optimal endpoint across 100+ providers.","editorTake":null,"bestFor":["benchmark-driven routing","latency optimization","cost vs quality tradeoffs"],"targetProviders":["openai-api","anthropic-api","google-ai-studio","gcp-vertex-ai","mistral-ai-api"],"targetProviderHrefs":["/provider/openai-api","/provider/anthropic-api","/provider/google-ai-studio","/provider/gcp-vertex-ai","/provider/mistral-ai-api"],"modelsCount":null,"apiCompatibility":["openai"],"pricingModel":"subscription","dataRetention":"unknown","selfHostAvailable":false,"href":"/router/unify","apiHref":"/api/router/unify","lastChecked":"2026-06-08"},{"slug":"vllm-semantic-router","name":"vLLM Semantic Router","vendor":"Red Hat / vLLM Project","type":"router","status":"active","summary":"Open-source Mixture-of-Models router that semantically classifies each request and routes it to the best backend (local, private, or frontier) by cost, latency, privacy, or safety, deployed as an Envoy External Processor.","editorTake":null,"bestFor":["open source","Kubernetes/OpenShift","privacy-aware routing","on-prem","edge/hybrid cloud"],"targetProviders":[],"targetProviderHrefs":[],"modelsCount":null,"apiCompatibility":["openai"],"pricingModel":"free_oss","dataRetention":"zero_retention","selfHostAvailable":true,"href":"/router/vllm-semantic-router","apiHref":"/api/router/vllm-semantic-router","lastChecked":"2026-06-08"}]}