77 lines
2.8 KiB
TOML
77 lines
2.8 KiB
TOML
# Anthropic direct
|
|
# Direct Anthropic entry for claude-opus-4-8.
# NOTE(review): unlike the other two Anthropic-direct entries, no `reasoning`
# capability is declared here — confirm that this is intentional.
[[model]]
id = "claude-opus-4-8"
provider = "anthropic"
context_window = 1_000_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.vision = true
# Explicit prompt caching, capped at 4 breakpoints.
capability.prompt_caching = { kind = "explicit", max_breakpoints = 4 }
|
|
|
|
# Direct Anthropic entry for claude-sonnet-4-6.
[[model]]
id = "claude-sonnet-4-6"
provider = "anthropic"
context_window = 1_000_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "budget_tokens"
capability.vision = true
# Explicit prompt caching, capped at 4 breakpoints.
capability.prompt_caching = { kind = "explicit", max_breakpoints = 4 }
|
|
|
|
# Direct Anthropic entry for claude-haiku-4-5; its context_window is smaller
# than the other two Anthropic-direct entries.
[[model]]
id = "claude-haiku-4-5"
provider = "anthropic"
context_window = 200_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "budget_tokens"
capability.vision = true
# Explicit prompt caching, capped at 4 breakpoints.
capability.prompt_caching = { kind = "explicit", max_breakpoints = 4 }
|
|
|
|
# Ollama local. These entries declare no `capability`: the provider is router-like and Ollama handles its own models.
|
|
# Local Ollama entry for llama3.3; no `capability` is declared for it.
[[model]]
id = "llama3.3"
provider = "ollama-local"
context_window = 128_000
|
|
|
|
# Local Ollama entry for qwen3-coder; no `capability` is declared for it.
[[model]]
id = "qwen3-coder"
provider = "ollama-local"
context_window = 256_000
|
|
|
|
# Codex OAuth (ChatGPT backend via Responses API)
|
|
# Codex CLI's model catalog exposes these coding models with a 272k effective
|
|
# context window on this route, even when public API docs advertise larger
|
|
# model-family windows.
|
|
# gpt-5.5 on the codex-oauth provider.
[[model]]
id = "gpt-5.5"
provider = "codex-oauth"
context_window = 272_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "effort"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# gpt-5.4 on the codex-oauth provider.
[[model]]
id = "gpt-5.4"
provider = "codex-oauth"
context_window = 272_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "effort"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# gpt-5.4-mini on the codex-oauth provider.
[[model]]
id = "gpt-5.4-mini"
provider = "codex-oauth"
context_window = 272_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "effort"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# gpt-5.3-codex-spark on the codex-oauth provider.
# NOTE(review): this entry reuses the same context_window and capability set as
# the other codex-oauth models — confirm that the 272000 window and
# `vision = true` really apply to this model as well.
[[model]]
id = "gpt-5.3-codex-spark"
provider = "codex-oauth"
context_window = 272_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "effort"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# OpenRouter
|
|
# anthropic/claude-opus-4.8 routed through the openrouter provider.
[[model]]
id = "anthropic/claude-opus-4.8"
provider = "openrouter"
context_window = 1_000_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "budget_tokens"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# anthropic/claude-sonnet-4.6 routed through the openrouter provider.
[[model]]
id = "anthropic/claude-sonnet-4.6"
provider = "openrouter"
context_window = 1_000_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "budget_tokens"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|
|
|
|
# openai/gpt-5.5 routed through the openrouter provider; it declares a larger
# context_window than the codex-oauth entry with id "gpt-5.5".
[[model]]
id = "openai/gpt-5.5"
provider = "openrouter"
context_window = 1_050_000
capability.tool_calling = "parallel"
capability.structured_output = "json_schema"
capability.reasoning = "effort"
capability.vision = true
capability.prompt_caching = { kind = "auto" }
|