llm-model-configの実装

2026-04-19 23:32:14 +09:00 · 2026-04-19 23:32:14 +09:00 · 230936274b
commit 230936274b
parent e1d672e9c0
50 changed files with 1718 additions and 1175 deletions
--- a/crates/llm-worker/examples/record_test_fixtures/main.rs
+++ b/crates/llm-worker/examples/record_test_fixtures/main.rs
@ -20,9 +20,35 @@ mod recorder;
 mod scenarios;

 use clap::{Parser, ValueEnum};
-use llm_worker::llm_client::providers::anthropic::AnthropicClient;
-use llm_worker::llm_client::providers::gemini::GeminiClient;
-use llm_worker::llm_client::providers::openai::OpenAIClient;
+use llm_worker::llm_client::capability::{
+    CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport,
+};
+use llm_worker::llm_client::scheme::{
+    Scheme, anthropic::AnthropicScheme, gemini::GeminiScheme, openai_chat::OpenAIScheme,
+};
+use llm_worker::llm_client::transport::{HttpTransport, ResolvedAuth};
+
+/// 既定の capability: fixture 記録には cache_control を付けない
+/// （既知モデルの静的テーブルを経由すると scheme 毎に自動設定される）。
+fn fallback_capability() -> ModelCapability {
+    ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: None,
+        vision: false,
+        prompt_caching: CacheStrategy::Auto,
+    }
+}
+
+fn make_transport<S: Scheme>(
+    scheme: S,
+    model: &str,
+    auth: ResolvedAuth,
+) -> HttpTransport<S> {
+    let cap = scheme.capability_for(model).unwrap_or_else(fallback_capability);
+    let base_url = scheme.default_base_url().to_string();
+    HttpTransport::new(scheme, model.to_string(), base_url, auth, cap)
+}

 #[derive(Parser, Debug)]
 #[command(author, version, about, long_about = None)]
@ -60,7 +86,11 @@ async fn run_scenario_with_anthropic(
    let api_key = std::env::var("ANTHROPIC_API_KEY")
        .expect("ANTHROPIC_API_KEY environment variable must be set");
    let model = model.as_deref().unwrap_or("claude-sonnet-4-20250514");
-    let client = AnthropicClient::new(&api_key, model);
+    let client = make_transport(
+        AnthropicScheme::new(),
+        model,
+        ResolvedAuth::ApiKey(api_key),
+    );

    recorder::record_request(
        &client,
@ -82,7 +112,7 @@ async fn run_scenario_with_openai(
    let api_key =
        std::env::var("OPENAI_API_KEY").expect("OPENAI_API_KEY environment variable must be set");
    let model = model.as_deref().unwrap_or("gpt-4o");
-    let client = OpenAIClient::new(&api_key, model);
+    let client = make_transport(OpenAIScheme::new(), model, ResolvedAuth::ApiKey(api_key));

    recorder::record_request(
        &client,
@ -101,10 +131,15 @@ async fn run_scenario_with_ollama(
    subdir: &str,
    model: Option<String>,
 ) -> Result<(), Box<dyn std::error::Error>> {
-    use llm_worker::llm_client::providers::ollama::OllamaClient;
-    // Ollama typically runs local, no key needed or placeholder
-    let model = model.as_deref().unwrap_or("llama3"); // default example
-    let client = OllamaClient::new(model); // base_url placeholder, handled by client default
+    // Ollama = Anthropic scheme + base_url 差し替え + 認証なし
+    let model = model.as_deref().unwrap_or("llama3");
+    let client = HttpTransport::new(
+        AnthropicScheme::new(),
+        model.to_string(),
+        "http://localhost:11434".to_string(),
+        ResolvedAuth::None,
+        fallback_capability(),
+    );

    recorder::record_request(
        &client,
@ -126,7 +161,7 @@ async fn run_scenario_with_gemini(
    let api_key =
        std::env::var("GEMINI_API_KEY").expect("GEMINI_API_KEY environment variable must be set");
    let model = model.as_deref().unwrap_or("gemini-2.0-flash");
-    let client = GeminiClient::new(&api_key, model);
+    let client = make_transport(GeminiScheme::new(), model, ResolvedAuth::ApiKey(api_key));

    recorder::record_request(
        &client,
--- a/crates/llm-worker/examples/worker_cancel_demo.rs
+++ b/crates/llm-worker/examples/worker_cancel_demo.rs
@ -2,7 +2,11 @@
 //!
 //! Example of cancelling from another thread during streaming

-use llm_worker::llm_client::providers::anthropic::AnthropicClient;
+use llm_worker::llm_client::capability::{
+    CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport,
+};
+use llm_worker::llm_client::scheme::{Scheme, anthropic::AnthropicScheme};
+use llm_worker::llm_client::transport::{HttpTransport, ResolvedAuth};
 use llm_worker::{Worker, WorkerResult};
 use std::time::Duration;

@ -22,7 +26,17 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
    let api_key =
        std::env::var("ANTHROPIC_API_KEY").expect("ANTHROPIC_API_KEY environment variable not set");

-    let client = AnthropicClient::new(&api_key, "claude-sonnet-4-20250514");
+    let scheme = AnthropicScheme::new();
+    let model = "claude-sonnet-4-20250514".to_string();
+    let cap = scheme.capability_for(&model).unwrap_or(ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: None,
+        vision: false,
+        prompt_caching: CacheStrategy::Auto,
+    });
+    let base_url = scheme.default_base_url().to_string();
+    let client = HttpTransport::new(scheme, model, base_url, ResolvedAuth::ApiKey(api_key), cap);
    let worker = Worker::new(client);

    println!("🚀 Starting Worker...");
--- a/crates/llm-worker/examples/worker_cli.rs
+++ b/crates/llm-worker/examples/worker_cli.rs
@ -44,10 +44,11 @@ use llm_worker::{
    interceptor::{Interceptor, PostToolAction, ToolResultInfo},
    llm_client::{
        LlmClient,
-        providers::{
-            anthropic::AnthropicClient, gemini::GeminiClient, ollama::OllamaClient,
-            openai::OpenAIClient,
+        capability::{CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport},
+        scheme::{
+            Scheme, anthropic::AnthropicScheme, gemini::GeminiScheme, openai_chat::OpenAIScheme,
        },
+        transport::{HttpTransport, ResolvedAuth},
    },
    timeline::{Handler, TextBlockEvent, TextBlockKind, ToolUseBlockEvent, ToolUseBlockKind},
 };
@ -327,6 +328,28 @@ fn get_api_key(args: &Args) -> Result<String, String> {
 }

 /// Create client based on provider
+fn default_capability() -> ModelCapability {
+    ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: None,
+        vision: false,
+        prompt_caching: CacheStrategy::Auto,
+    }
+}
+
+fn build_transport<S: Scheme>(
+    scheme: S,
+    model: String,
+    auth: ResolvedAuth,
+) -> Box<dyn LlmClient> {
+    let cap = scheme
+        .capability_for(&model)
+        .unwrap_or_else(default_capability);
+    let base_url = scheme.default_base_url().to_string();
+    Box::new(HttpTransport::new(scheme, model, base_url, auth, cap))
+}
+
 fn create_client(args: &Args) -> Result<Box<dyn LlmClient>, String> {
    let model = args
        .model
@ -336,21 +359,32 @@ fn create_client(args: &Args) -> Result<Box<dyn LlmClient>, String> {
    let api_key = get_api_key(args)?;

    match args.provider {
-        Provider::Anthropic => {
-            let client = AnthropicClient::new(&api_key, &model);
-            Ok(Box::new(client))
-        }
-        Provider::Gemini => {
-            let client = GeminiClient::new(&api_key, &model);
-            Ok(Box::new(client))
-        }
-        Provider::Openai => {
-            let client = OpenAIClient::new(&api_key, &model);
-            Ok(Box::new(client))
-        }
+        Provider::Anthropic => Ok(build_transport(
+            AnthropicScheme::new(),
+            model,
+            ResolvedAuth::ApiKey(api_key),
+        )),
+        Provider::Gemini => Ok(build_transport(
+            GeminiScheme::new(),
+            model,
+            ResolvedAuth::ApiKey(api_key),
+        )),
+        Provider::Openai => Ok(build_transport(
+            OpenAIScheme::new(),
+            model,
+            ResolvedAuth::ApiKey(api_key),
+        )),
        Provider::Ollama => {
-            let client = OllamaClient::new(&model);
-            Ok(Box::new(client))
+            // Ollama = Anthropic scheme + base_url 差し替え + 認証なし
+            let scheme = AnthropicScheme::new();
+            let cap = default_capability();
+            Ok(Box::new(HttpTransport::new(
+                scheme,
+                model,
+                "http://localhost:11434".to_string(),
+                ResolvedAuth::None,
+                cap,
+            )))
        }
    }
 }
--- a/crates/llm-worker/src/llm_client/auth.rs
+++ b/crates/llm-worker/src/llm_client/auth.rs
@ -0,0 +1,23 @@
+//! `Scheme` 実装と通信層が要求する認証要件。
+//!
+//! マニフェスト側の型（`ModelConfig` / `SchemeKind` / `AuthRef`）は
+//! `crates/manifest` に置き、llm-worker はそれを知らずに済む。
+//! `AuthRequirement` は scheme が宣言する「この scheme はどんな認証を
+//! 期待するか」のランタイム記述で、manifest 側の `AuthRef` との
+//! 照合（`AuthRef → ResolvedAuth` 変換の適否）は `crates/provider`
+//! で行う。
+
+/// `Scheme::required_auth()` が返す認証要件。
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum AuthRequirement {
+    /// 認証を行わない（Ollama など）
+    None,
+    /// `Authorization: Bearer <token>` ヘッダ（token は API key 相当）
+    Bearer,
+    /// `x-api-key: <token>` ヘッダ（Anthropic 形式）
+    XApiKey,
+    /// クエリパラメータ `?<name>=<token>`（Gemini 形式）
+    QueryParam { name: &'static str },
+    /// 複合ヘッダ（Codex OAuth 等、`crates/provider` 側で解決）
+    Custom,
+}
--- a/crates/llm-worker/src/llm_client/capability.rs
+++ b/crates/llm-worker/src/llm_client/capability.rs
@ -0,0 +1,102 @@
+//! モデル能力メタデータ
+//!
+//! `ModelCapability` はモデルが持つ機能差を表現する。scheme は同じでも
+//! モデルごとに reasoning 可否や prompt caching 方式が違うため、scheme
+//! から分離して保持する。
+//!
+//! 値の供給経路は 2 通り:
+//! 1. scheme 実装側の `model_id → ModelCapability` 静的テーブル（既知モデル）
+//! 2. `ModelConfig::capability` での明示 override（未知モデル、または上書き）
+
+use serde::{Deserialize, Serialize};
+
+/// モデル能力メタデータ
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct ModelCapability {
+    pub tool_calling: ToolCallingSupport,
+    pub structured_output: StructuredOutput,
+    #[serde(default)]
+    pub reasoning: Option<ReasoningSupport>,
+    #[serde(default)]
+    pub vision: bool,
+    pub prompt_caching: CacheStrategy,
+}
+
+impl ModelCapability {
+    /// 何もサポートしない安全側デフォルト。未知モデルのフォールバック用。
+    pub const fn minimal() -> Self {
+        Self {
+            tool_calling: ToolCallingSupport::None,
+            structured_output: StructuredOutput::None,
+            reasoning: None,
+            vision: false,
+            prompt_caching: CacheStrategy::Auto,
+        }
+    }
+}
+
+/// ツール呼び出しサポート
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "snake_case")]
+pub enum ToolCallingSupport {
+    /// 非サポート
+    None,
+    /// 1 回のレスポンスで 1 ツールのみ
+    Sequential,
+    /// 1 回のレスポンスで複数ツール並行
+    Parallel,
+}
+
+/// Structured output サポート
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "snake_case")]
+pub enum StructuredOutput {
+    None,
+    /// `json_object` モード（スキーマなし JSON 強制）
+    JsonObject,
+    /// JSON Schema 指定で構造化出力
+    JsonSchema,
+}
+
+/// Reasoning（extended thinking）サポート
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "snake_case")]
+pub enum ReasoningSupport {
+    /// OpenAI 形式: `reasoning.effort` (low/medium/high)
+    Effort,
+    /// Anthropic 形式: `thinking.budget_tokens`
+    BudgetTokens,
+    /// 両対応（内部では共通 `ReasoningControl` として扱い、各 scheme で投影）
+    Both,
+}
+
+/// Prompt caching 戦略
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(tag = "kind", rename_all = "snake_case")]
+pub enum CacheStrategy {
+    /// Anthropic: `cache_control` マーカーを明示挿入
+    Explicit { max_breakpoints: u8 },
+    /// それ以外: サーバ側自動 prefix、または未サポート
+    Auto,
+}
+
+/// Reasoning 制御（共通型、scheme 側で各社形式に投影）
+///
+/// `effort` / `budget_tokens` はユーザー設定から任意で渡される。Scheme
+/// 側は自身の `ReasoningSupport` に応じて片方だけ使う。両方が宣言
+/// されている場合の優先順位は scheme 実装が決める。
+#[derive(Debug, Clone, Default, Serialize, Deserialize, PartialEq, Eq)]
+pub struct ReasoningControl {
+    #[serde(default)]
+    pub effort: Option<ReasoningEffort>,
+    #[serde(default)]
+    pub budget_tokens: Option<u32>,
+}
+
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "lowercase")]
+pub enum ReasoningEffort {
+    Low,
+    Medium,
+    High,
+}
--- a/crates/llm-worker/src/llm_client/mod.rs
+++ b/crates/llm-worker/src/llm_client/mod.rs
@ -16,14 +16,18 @@
 //! - `providers`: プロバイダ固有のクライアント実装
 //! - `scheme`: APIスキーマ（リクエスト/レスポンス変換）

+pub mod auth;
+pub mod capability;
 pub mod client;
 pub mod error;
 pub mod event;
 pub mod types;

-pub mod providers;
 pub mod scheme;
+pub mod transport;

+pub use auth::*;
+pub use capability::*;
 pub use client::*;
 pub use error::*;
 pub use event::*;
--- a/crates/llm-worker/src/llm_client/providers/anthropic.rs
+++ b/crates/llm-worker/src/llm_client/providers/anthropic.rs
@ -1,206 +0,0 @@
-//! Anthropic プロバイダ実装
-//!
-//! Anthropic Messages APIと通信し、Eventストリームを出力
-
-use std::pin::Pin;
-
-use crate::llm_client::{
-    ClientError, LlmClient, Request, event::Event, scheme::anthropic::AnthropicScheme,
-};
-use async_trait::async_trait;
-use eventsource_stream::Eventsource;
-use futures::{Stream, StreamExt, TryStreamExt, future::ready};
-use reqwest::header::{CONTENT_TYPE, HeaderMap, HeaderValue};
-
-/// Anthropic クライアント
-#[derive(Clone)]
-pub struct AnthropicClient {
-    /// HTTPクライアント
-    http_client: reqwest::Client,
-    /// APIキー
-    api_key: String,
-    /// モデル名
-    model: String,
-    /// スキーマ
-    scheme: AnthropicScheme,
-    /// ベースURL
-    base_url: String,
-}
-
-impl AnthropicClient {
-    /// 新しいAnthropicクライアントを作成
-    pub fn new(api_key: impl Into<String>, model: impl Into<String>) -> Self {
-        Self {
-            http_client: reqwest::Client::new(),
-            api_key: api_key.into(),
-            model: model.into(),
-            scheme: AnthropicScheme::default(),
-            base_url: "https://api.anthropic.com".to_string(),
-        }
-    }
-
-    /// カスタムHTTPクライアントを設定
-    pub fn with_http_client(mut self, client: reqwest::Client) -> Self {
-        self.http_client = client;
-        self
-    }
-
-    /// スキーマを設定
-    pub fn with_scheme(mut self, scheme: AnthropicScheme) -> Self {
-        self.scheme = scheme;
-        self
-    }
-
-    /// ベースURLを設定
-    pub fn with_base_url(mut self, url: impl Into<String>) -> Self {
-        self.base_url = url.into();
-        self
-    }
-
-    /// リクエストヘッダーを構築
-    fn build_headers(&self) -> Result<HeaderMap, ClientError> {
-        let mut headers = HeaderMap::new();
-
-        headers.insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
-        headers.insert(
-            "x-api-key",
-            HeaderValue::from_str(&self.api_key)
-                .map_err(|e| ClientError::Config(format!("Invalid API key: {}", e)))?,
-        );
-        headers.insert(
-            "anthropic-version",
-            HeaderValue::from_str(&self.scheme.api_version)
-                .map_err(|e| ClientError::Config(format!("Invalid API version: {}", e)))?,
-        );
-
-        // 細粒度ツールストリーミングを有効にする場合
-        if self.scheme.fine_grained_tool_streaming {
-            headers.insert(
-                "anthropic-beta",
-                HeaderValue::from_static("fine-grained-tool-streaming-2025-05-14"),
-            );
-        }
-
-        Ok(headers)
-    }
-}
-
-#[async_trait]
-impl LlmClient for AnthropicClient {
-    fn clone_boxed(&self) -> Box<dyn LlmClient> {
-        Box::new(self.clone())
-    }
-
-    async fn stream(
-        &self,
-        request: Request,
-    ) -> Result<Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>>, ClientError> {
-        let url = format!("{}/v1/messages", self.base_url);
-        let headers = self.build_headers()?;
-        let body = self.scheme.build_request(&self.model, &request);
-
-        let response = self
-            .http_client
-            .post(&url)
-            .headers(headers)
-            .json(&body)
-            .send()
-            .await?;
-
-        // エラーレスポンスをチェック
-        if !response.status().is_success() {
-            let status = response.status().as_u16();
-            let text = response.text().await.unwrap_or_default();
-
-            // JSONでエラーをパースしてみる
-            if let Ok(json) = serde_json::from_str::<serde_json::Value>(&text) {
-                let error = json.get("error").unwrap_or(&json);
-                let code = error.get("type").and_then(|v| v.as_str()).map(String::from);
-                let message = error
-                    .get("message")
-                    .and_then(|v| v.as_str())
-                    .unwrap_or(&text)
-                    .to_string();
-                return Err(ClientError::Api {
-                    status: Some(status),
-                    code,
-                    message,
-                });
-            }
-
-            return Err(ClientError::Api {
-                status: Some(status),
-                code: None,
-                message: text,
-            });
-        }
-
-        // SSEストリームを構築
-        let scheme = self.scheme.clone();
-        let byte_stream = response
-            .bytes_stream()
-            .map_err(|e| std::io::Error::other(e));
-        let event_stream = byte_stream.eventsource();
-
-        // AnthropicはBlockStopイベントに正しいblock_typeを含まないため、
-        // クライアント側で状態を追跡して補完する
-        let mut current_block_type = None;
-
-        let stream = event_stream.filter_map(move |result| {
-            ready(match result {
-                Ok(event) => {
-                    // SSEイベントをパース
-                    match scheme.parse_event(&event.event, &event.data) {
-                        Ok(Some(mut evt)) => {
-                            // ブロックタイプの追跡と修正
-                            match &evt {
-                                Event::BlockStart(start) => {
-                                    current_block_type = Some(start.block_type);
-                                }
-                                Event::BlockStop(stop) => {
-                                    if let Some(block_type) = current_block_type.take() {
-                                        // 正しいブロックタイプで上書き
-                                        // (Event::BlockStopの中身を置換)
-                                        evt =
-                                            Event::BlockStop(crate::llm_client::event::BlockStop {
-                                                block_type,
-                                                ..stop.clone()
-                                            });
-                                    }
-                                }
-                                _ => {}
-                            }
-                            Some(Ok(evt))
-                        }
-                        Ok(None) => None,
-                        Err(e) => Some(Err(e)),
-                    }
-                }
-                Err(e) => Some(Err(ClientError::Sse(e.to_string()))),
-            })
-        });
-
-        Ok(Box::pin(stream))
-    }
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_client_creation() {
-        let client = AnthropicClient::new("test-key", "claude-sonnet-4-20250514");
-        assert_eq!(client.model, "claude-sonnet-4-20250514");
-    }
-
-    #[test]
-    fn test_build_headers() {
-        let client = AnthropicClient::new("test-key", "claude-sonnet-4-20250514");
-        let headers = client.build_headers().unwrap();
-
-        assert!(headers.contains_key("x-api-key"));
-        assert!(headers.contains_key("anthropic-version"));
-        assert!(headers.contains_key("anthropic-beta"));
-    }
-}
--- a/crates/llm-worker/src/llm_client/providers/gemini.rs
+++ b/crates/llm-worker/src/llm_client/providers/gemini.rs
@ -1,190 +0,0 @@
-//! Gemini プロバイダ実装
-//!
-//! Google Gemini APIと通信し、Eventストリームを出力
-
-use std::pin::Pin;
-
-use crate::llm_client::{
-    ClientError, LlmClient, Request, event::Event, scheme::gemini::GeminiScheme,
-};
-use async_trait::async_trait;
-use eventsource_stream::Eventsource;
-use futures::{Stream, StreamExt, TryStreamExt};
-use reqwest::header::{CONTENT_TYPE, HeaderMap, HeaderValue};
-
-/// Gemini クライアント
-#[derive(Clone)]
-pub struct GeminiClient {
-    /// HTTPクライアント
-    http_client: reqwest::Client,
-    /// APIキー
-    api_key: String,
-    /// モデル名
-    model: String,
-    /// スキーマ
-    scheme: GeminiScheme,
-    /// ベースURL
-    base_url: String,
-}
-
-impl GeminiClient {
-    /// 新しいGeminiクライアントを作成
-    pub fn new(api_key: impl Into<String>, model: impl Into<String>) -> Self {
-        Self {
-            http_client: reqwest::Client::new(),
-            api_key: api_key.into(),
-            model: model.into(),
-            scheme: GeminiScheme::default(),
-            base_url: "https://generativelanguage.googleapis.com".to_string(),
-        }
-    }
-
-    /// カスタムHTTPクライアントを設定
-    pub fn with_http_client(mut self, client: reqwest::Client) -> Self {
-        self.http_client = client;
-        self
-    }
-
-    /// スキーマを設定
-    pub fn with_scheme(mut self, scheme: GeminiScheme) -> Self {
-        self.scheme = scheme;
-        self
-    }
-
-    /// ベースURLを設定
-    pub fn with_base_url(mut self, url: impl Into<String>) -> Self {
-        self.base_url = url.into();
-        self
-    }
-
-    /// リクエストヘッダーを構築
-    fn build_headers(&self) -> Result<HeaderMap, ClientError> {
-        let mut headers = HeaderMap::new();
-
-        headers.insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
-
-        Ok(headers)
-    }
-}
-
-#[async_trait]
-impl LlmClient for GeminiClient {
-    fn clone_boxed(&self) -> Box<dyn LlmClient> {
-        Box::new(self.clone())
-    }
-
-    async fn stream(
-        &self,
-        request: Request,
-    ) -> Result<Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>>, ClientError> {
-        // URL構築: base_url/v1beta/models/{model}:streamGenerateContent?alt=sse&key={api_key}
-        let url = format!(
-            "{}/v1beta/models/{}:streamGenerateContent?alt=sse&key={}",
-            self.base_url, self.model, self.api_key
-        );
-
-        let headers = self.build_headers()?;
-        let body = self.scheme.build_request(&request);
-
-        let response = self
-            .http_client
-            .post(&url)
-            .headers(headers)
-            .json(&body)
-            .send()
-            .await?;
-
-        // エラーレスポンスをチェック
-        if !response.status().is_success() {
-            let status = response.status().as_u16();
-            let text = response.text().await.unwrap_or_default();
-
-            // JSONでエラーをパースしてみる
-            if let Ok(json) = serde_json::from_str::<serde_json::Value>(&text) {
-                // Gemini error format: { "error": { "code": xxx, "message": "...", "status": "..." } }
-                let error = json.get("error").unwrap_or(&json);
-                let code = error
-                    .get("status")
-                    .and_then(|v| v.as_str())
-                    .map(String::from);
-                let message = error
-                    .get("message")
-                    .and_then(|v| v.as_str())
-                    .unwrap_or(&text)
-                    .to_string();
-                return Err(ClientError::Api {
-                    status: Some(status),
-                    code,
-                    message,
-                });
-            }
-
-            return Err(ClientError::Api {
-                status: Some(status),
-                code: None,
-                message: text,
-            });
-        }
-
-        // SSEストリームを構築
-        let scheme = self.scheme.clone();
-        let byte_stream = response
-            .bytes_stream()
-            .map_err(|e| std::io::Error::other(e));
-        let event_stream = byte_stream.eventsource();
-
-        let stream = event_stream
-            .map(move |result| {
-                match result {
-                    Ok(event) => {
-                        // SSEイベントをパース
-                        // Geminiは "data: {...}" 形式で送る
-                        match scheme.parse_event(&event.data) {
-                            Ok(Some(events)) => Ok(Some(events)),
-                            Ok(None) => Ok(None),
-                            Err(e) => Err(e),
-                        }
-                    }
-                    Err(e) => Err(ClientError::Sse(e.to_string())),
-                }
-            })
-            // flatten Option<Vec<Event>> stream to Stream<Event>
-            .map(|res| {
-                let s: Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>> = match res {
-                    Ok(Some(events)) => Box::pin(futures::stream::iter(events.into_iter().map(Ok))),
-                    Ok(None) => Box::pin(futures::stream::empty()),
-                    Err(e) => Box::pin(futures::stream::once(async move { Err(e) })),
-                };
-                s
-            })
-            .flatten();
-
-        Ok(Box::pin(stream))
-    }
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_client_creation() {
-        let client = GeminiClient::new("test-key", "gemini-2.0-flash");
-        assert_eq!(client.model, "gemini-2.0-flash");
-    }
-
-    #[test]
-    fn test_build_headers() {
-        let client = GeminiClient::new("test-key", "gemini-2.0-flash");
-        let headers = client.build_headers().unwrap();
-
-        assert!(headers.contains_key("content-type"));
-    }
-
-    #[test]
-    fn test_custom_base_url() {
-        let client = GeminiClient::new("test-key", "gemini-2.0-flash")
-            .with_base_url("https://custom.api.example.com");
-        assert_eq!(client.base_url, "https://custom.api.example.com");
-    }
-}
--- a/crates/llm-worker/src/llm_client/providers/mod.rs
+++ b/crates/llm-worker/src/llm_client/providers/mod.rs
@ -1,8 +0,0 @@
-//! プロバイダ実装
-//!
-//! 各プロバイダ固有のHTTPクライアント実装
-
-pub mod anthropic;
-pub mod gemini;
-pub mod ollama;
-pub mod openai;
--- a/crates/llm-worker/src/llm_client/providers/ollama.rs
+++ b/crates/llm-worker/src/llm_client/providers/ollama.rs
@ -1,67 +0,0 @@
-//! Ollama プロバイダ実装
-//!
-//! OllamaはOpenAI互換APIを提供するため、OpenAIクライアントと互換性がある。
-//! デフォルトのベースURLと認証設定が異なる。
-
-use std::pin::Pin;
-
-use crate::llm_client::{
-    ClientError, LlmClient, Request, event::Event, providers::openai::OpenAIClient,
-    scheme::openai::OpenAIScheme,
-};
-use async_trait::async_trait;
-use futures::Stream;
-
-/// Ollama クライアント
-///
-/// 内部的にOpenAIClientを使用するラッパー、もしくはOpenAIClientと同様の実装を持つ。
-/// ここではOpenAIClient構成をカスタマイズして提供する。
-#[derive(Clone)]
-pub struct OllamaClient {
-    inner: OpenAIClient,
-}
-
-impl OllamaClient {
-    /// 新しいOllamaクライアントを作成
-    pub fn new(model: impl Into<String>) -> Self {
-        // Ollama usually runs on localhost:11434/v1
-        // API key is "ollama" or ignored
-        let base_url = "http://localhost:11434";
-
-        let scheme = OpenAIScheme::new().with_legacy_max_tokens(true);
-
-        let client = OpenAIClient::new("ollama", model)
-            .with_base_url(base_url)
-            .with_scheme(scheme);
-        // Currently OpenAIScheme sets include_usage: true. Ollama supports checks?
-        // Assuming Ollama modern versions support usage.
-
-        Self { inner: client }
-    }
-
-    /// ベースURLを設定
-    pub fn with_base_url(mut self, url: impl Into<String>) -> Self {
-        self.inner = self.inner.with_base_url(url);
-        self
-    }
-
-    /// カスタムHTTPクライアントを設定
-    pub fn with_http_client(mut self, client: reqwest::Client) -> Self {
-        self.inner = self.inner.with_http_client(client);
-        self
-    }
-}
-
-#[async_trait]
-impl LlmClient for OllamaClient {
-    fn clone_boxed(&self) -> Box<dyn LlmClient> {
-        Box::new(self.clone())
-    }
-
-    async fn stream(
-        &self,
-        request: Request,
-    ) -> Result<Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>>, ClientError> {
-        self.inner.stream(request).await
-    }
-}
--- a/crates/llm-worker/src/llm_client/providers/openai.rs
+++ b/crates/llm-worker/src/llm_client/providers/openai.rs
@ -1,217 +0,0 @@
-//! OpenAI プロバイダ実装
-//!
-//! OpenAI Chat Completions APIと通信し、Eventストリームを出力
-
-use std::pin::Pin;
-
-use crate::llm_client::{
-    ClientError, ConfigWarning, LlmClient, Request, RequestConfig, event::Event,
-    scheme::openai::OpenAIScheme,
-};
-use async_trait::async_trait;
-use eventsource_stream::Eventsource;
-use futures::{Stream, StreamExt, TryStreamExt};
-use reqwest::header::{CONTENT_TYPE, HeaderMap, HeaderValue};
-
-/// OpenAI クライアント
-#[derive(Clone)]
-pub struct OpenAIClient {
-    /// HTTPクライアント
-    http_client: reqwest::Client,
-    /// APIキー
-    api_key: String,
-    /// モデル名
-    model: String,
-    /// スキーマ
-    scheme: OpenAIScheme,
-    /// ベースURL
-    base_url: String,
-}
-
-impl OpenAIClient {
-    /// 新しいOpenAIクライアントを作成
-    pub fn new(api_key: impl Into<String>, model: impl Into<String>) -> Self {
-        Self {
-            http_client: reqwest::Client::new(),
-            api_key: api_key.into(),
-            model: model.into(),
-            scheme: OpenAIScheme::default(),
-            base_url: "https://api.openai.com".to_string(),
-        }
-    }
-
-    /// カスタムHTTPクライアントを設定
-    pub fn with_http_client(mut self, client: reqwest::Client) -> Self {
-        self.http_client = client;
-        self
-    }
-
-    /// スキーマを設定
-    pub fn with_scheme(mut self, scheme: OpenAIScheme) -> Self {
-        self.scheme = scheme;
-        self
-    }
-
-    /// ベースURLを設定
-    pub fn with_base_url(mut self, url: impl Into<String>) -> Self {
-        self.base_url = url.into();
-        self
-    }
-
-    /// リクエストヘッダーを構築
-    fn build_headers(&self) -> Result<HeaderMap, ClientError> {
-        let mut headers = HeaderMap::new();
-
-        headers.insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
-
-        let api_key_val = if self.api_key.is_empty() {
-            // For providers like Ollama, API key might be empty/dummy.
-            // But typical OpenAI requires it.
-            // We'll allow empty if user intends it, but usually it's checked.
-            HeaderValue::from_static("")
-        } else {
-            let mut val = HeaderValue::from_str(&format!("Bearer {}", self.api_key))
-                .map_err(|e| ClientError::Config(format!("Invalid API key: {}", e)))?;
-            val.set_sensitive(true);
-            val
-        };
-
-        if !api_key_val.is_empty() {
-            headers.insert("Authorization", api_key_val);
-        }
-
-        Ok(headers)
-    }
-}
-
-#[async_trait]
-impl LlmClient for OpenAIClient {
-    fn clone_boxed(&self) -> Box<dyn LlmClient> {
-        Box::new(self.clone())
-    }
-
-    async fn stream(
-        &self,
-        request: Request,
-    ) -> Result<Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>>, ClientError> {
-        // Construct the URL: base_url usually ends without slash, path starts with slash or vice versa.
-        // Standard OpenAI base is "https://api.openai.com". Endpoint is "/v1/chat/completions".
-        // If external base_url includes /v1, we should be careful.
-        // Let's assume defaults. If user provides "http://localhost:11434/v1", we append "/chat/completions".
-        // Or cleaner: user provides full base up to version?
-        // Anthropic client uses "{}/v1/messages".
-        // Let's stick to appending "/v1/chat/completions" if base is just host,
-        // OR assume base includes /v1 if user overrides it?
-        // Let's use robust joining or simple assumption matching Anthropic pattern:
-        // Default: https://api.openai.com -> https://api.openai.com/v1/chat/completions
-
-        // However, Ollama default is http://localhost:11434/v1/chat/completions if using OpenAI compact.
-        // If we configure base_url via `with_base_url`, it's flexible.
-        // Let's try to detect if /v1 is present or just append consistently.
-        // Ideally `base_url` should be the root passed to `new`.
-
-        let url = if self.base_url.ends_with("/v1") {
-            format!("{}/chat/completions", self.base_url)
-        } else if self.base_url.ends_with("/") {
-            format!("{}v1/chat/completions", self.base_url)
-        } else {
-            format!("{}/v1/chat/completions", self.base_url)
-        };
-
-        let headers = self.build_headers()?;
-        let body = self.scheme.build_request(&self.model, &request);
-
-        let response = self
-            .http_client
-            .post(&url)
-            .headers(headers)
-            .json(&body)
-            .send()
-            .await?;
-
-        // エラーレスポンスをチェック
-        if !response.status().is_success() {
-            let status = response.status().as_u16();
-            let text = response.text().await.unwrap_or_default();
-
-            // JSONでエラーをパースしてみる
-            if let Ok(json) = serde_json::from_str::<serde_json::Value>(&text) {
-                // OpenAI error format: { "error": { "message": "...", "type": "...", ... } }
-                let error = json.get("error").unwrap_or(&json);
-                let code = error.get("type").and_then(|v| v.as_str()).map(String::from);
-                let message = error
-                    .get("message")
-                    .and_then(|v| v.as_str())
-                    .unwrap_or(&text)
-                    .to_string();
-                return Err(ClientError::Api {
-                    status: Some(status),
-                    code,
-                    message,
-                });
-            }
-
-            return Err(ClientError::Api {
-                status: Some(status),
-                code: None,
-                message: text,
-            });
-        }
-
-        // SSEストリームを構築
-        let scheme = self.scheme.clone();
-        let byte_stream = response
-            .bytes_stream()
-            .map_err(|e| std::io::Error::other(e));
-        let event_stream = byte_stream.eventsource();
-
-        let stream = event_stream
-            .map(move |result| {
-                match result {
-                    Ok(event) => {
-                        // SSEイベントをパース
-                        // OpenAI stream events are "data: {...}"
-                        // event.event is usually "message" (default) or empty.
-                        // parse_event takes data string.
-
-                        if event.data == "[DONE]" {
-                            // End of stream handled inside parse_event usually returning None
-                            Ok(None)
-                        } else {
-                            match scheme.parse_event(&event.data) {
-                                Ok(Some(events)) => Ok(Some(events)),
-                                Ok(None) => Ok(None),
-                                Err(e) => Err(e),
-                            }
-                        }
-                    }
-                    Err(e) => Err(ClientError::Sse(e.to_string())),
-                }
-            })
-            // flatten Option<Vec<Event>> stream to Stream<Event>
-            // map returns Result<Option<Vec<Event>>, Error>
-            // We want Stream<Item = Result<Event, Error>>
-            .map(|res| {
-                let s: Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>> = match res {
-                    Ok(Some(events)) => Box::pin(futures::stream::iter(events.into_iter().map(Ok))),
-                    Ok(None) => Box::pin(futures::stream::empty()),
-                    Err(e) => Box::pin(futures::stream::once(async move { Err(e) })),
-                };
-                s
-            })
-            .flatten();
-
-        Ok(Box::pin(stream))
-    }
-
-    fn validate_config(&self, config: &RequestConfig) -> Vec<ConfigWarning> {
-        let mut warnings = Vec::new();
-
-        // OpenAI does not support top_k
-        if config.top_k.is_some() {
-            warnings.push(ConfigWarning::unsupported("top_k", "OpenAI"));
-        }
-
-        warnings
-    }
-}
--- a/crates/llm-worker/src/llm_client/scheme/anthropic/capability.rs
+++ b/crates/llm-worker/src/llm_client/scheme/anthropic/capability.rs
@ -0,0 +1,26 @@
+//! `model_id → ModelCapability` 静的テーブル。
+//!
+//! 既知モデルのみ網羅する。未知モデルは `None` を返し、呼び出し側
+//! （`HttpTransport` 構築時）に scheme 既定へフォールバックさせる。
+
+use crate::llm_client::capability::{
+    CacheStrategy, ModelCapability, ReasoningSupport, StructuredOutput, ToolCallingSupport,
+};
+
+/// Anthropic 公式モデルの既定 capability。
+///
+/// `claude-sonnet-*` / `claude-opus-*` / `claude-haiku-*` に対応する。
+/// `cache_control` は公式のみ有効で、最大 4 breakpoint（公式仕様）。
+pub(crate) fn lookup(model_id: &str) -> Option<ModelCapability> {
+    if !model_id.starts_with("claude-") {
+        return None;
+    }
+    Some(ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: Some(ReasoningSupport::BudgetTokens),
+        vision: true,
+        prompt_caching: CacheStrategy::Explicit { max_breakpoints: 4 },
+    })
+}
+
--- a/crates/llm-worker/src/llm_client/scheme/anthropic/mod.rs
+++ b/crates/llm-worker/src/llm_client/scheme/anthropic/mod.rs
@ -3,8 +3,12 @@
 //! - リクエストJSON生成
 //! - SSEイベントパース → Event変換

+mod capability;
 mod events;
 mod request;
+mod scheme_impl;
+
+pub use scheme_impl::AnthropicState;

 /// Anthropicスキーマ
 ///
--- a/crates/llm-worker/src/llm_client/scheme/anthropic/request.rs
+++ b/crates/llm-worker/src/llm_client/scheme/anthropic/request.rs
@ -8,6 +8,7 @@ use serde::Serialize;

 use crate::llm_client::{
    Request,
+    capability::{CacheStrategy, ModelCapability, ReasoningSupport},
    types::{ContentPart, Item, Role, ToolDefinition, parse_tool_arguments},
 };

@ -32,6 +33,15 @@ pub(crate) struct AnthropicRequest {
    #[serde(skip_serializing_if = "Vec::is_empty")]
    pub stop_sequences: Vec<String>,
    pub stream: bool,
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub thinking: Option<AnthropicThinking>,
+}
+
+/// Anthropic extended thinking 指示。
+#[derive(Debug, Serialize)]
+#[serde(tag = "type", rename_all = "snake_case")]
+pub(crate) enum AnthropicThinking {
+    Enabled { budget_tokens: u32 },
 }

 /// Anthropic message
@ -130,12 +140,40 @@ pub(crate) struct AnthropicTool {
 }

 impl AnthropicScheme {
-    /// Build Anthropic request from Request
-    pub(crate) fn build_request(&self, model: &str, request: &Request) -> AnthropicRequest {
-        let breakpoints = compute_breakpoints(&request.items, request.cache_anchor);
+    /// Build Anthropic request from Request.
+    ///
+    /// `capability.prompt_caching` が [`CacheStrategy::Auto`] のときは
+    /// `cache_control` マーカーを一切挿入しない（Ollama の `/v1/messages`
+    /// 流用時など、サーバ側が `cache_control` を受け付けないケース）。
+    pub(crate) fn build_request(
+        &self,
+        model: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> AnthropicRequest {
+        let breakpoints = if matches!(capability.prompt_caching, CacheStrategy::Explicit { .. }) {
+            compute_breakpoints(&request.items, request.cache_anchor)
+        } else {
+            BTreeSet::new()
+        };
        let messages = self.convert_items_to_messages(&request.items, &breakpoints);
        let tools = request.tools.iter().map(|t| self.convert_tool(t)).collect();

+        // Reasoning の投影: capability が BudgetTokens / Both をサポート
+        // していて、request 側で budget_tokens が指定されているときだけ
+        // thinking フィールドを付ける。
+        let supports_budget_tokens = matches!(
+            capability.reasoning,
+            Some(ReasoningSupport::BudgetTokens | ReasoningSupport::Both),
+        );
+        let thinking = request
+            .config
+            .reasoning
+            .as_ref()
+            .and_then(|rc| rc.budget_tokens)
+            .filter(|_| supports_budget_tokens)
+            .map(|budget_tokens| AnthropicThinking::Enabled { budget_tokens });
+
        AnthropicRequest {
            model: model.to_string(),
            max_tokens: request.config.max_tokens.unwrap_or(4096),
@ -147,6 +185,7 @@ impl AnthropicScheme {
            top_k: request.config.top_k,
            stop_sequences: request.config.stop_sequences.clone(),
            stream: true,
+            thinking,
        }
    }

@ -360,6 +399,28 @@ fn compute_breakpoints(items: &[Item], cache_anchor: Option<usize>) -> BTreeSet<
 #[cfg(test)]
 mod tests {
    use super::*;
+    use crate::llm_client::capability::{
+        CacheStrategy, StructuredOutput, ToolCallingSupport,
+    };
+
+    /// cache_control が有効になる既定の capability。
+    fn cap_explicit() -> ModelCapability {
+        ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: false,
+            prompt_caching: CacheStrategy::Explicit { max_breakpoints: 4 },
+        }
+    }
+
+    /// cache_control を送らない capability（Ollama 等）。
+    fn cap_auto() -> ModelCapability {
+        ModelCapability {
+            prompt_caching: CacheStrategy::Auto,
+            ..cap_explicit()
+        }
+    }

    #[test]
    fn test_build_simple_request() {
@ -368,7 +429,7 @@ mod tests {
            .system("You are a helpful assistant.")
            .user("Hello!");

-        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());

        assert_eq!(anthropic_req.model, "claude-sonnet-4-20250514");
        assert_eq!(
@ -394,7 +455,7 @@ mod tests {
                })),
        );

-        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());

        assert_eq!(anthropic_req.tools.len(), 1);
        assert_eq!(anthropic_req.tools[0].name, "get_weather");
@ -412,7 +473,7 @@ mod tests {
            ))
            .item(Item::tool_result("call_123", "Sunny, 25°C"));

-        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let anthropic_req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());

        assert_eq!(anthropic_req.messages.len(), 3);
        assert_eq!(anthropic_req.messages[0].role, "user");
@ -469,7 +530,7 @@ mod tests {
        let mut request = Request::new().items(items);
        request.cache_anchor = Some(0);

-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 3, "expected 3 breakpoints, got {:?}", bps);
        for (_, _, cc) in bps {
@ -485,7 +546,7 @@ mod tests {
        // cache_anchor=None, turn_end=4, head=5.
        let request = Request::new().items(items);

-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 2, "expected 2 breakpoints, got {:?}", bps);
    }
@ -495,7 +556,7 @@ mod tests {
        let scheme = AnthropicScheme::new();
        let request = Request::new().user("first ever turn");
        // latest user at 0 → no turn_end; head=0; no anchor. Collapse → 1.
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 1, "expected 1 breakpoint, got {:?}", bps);
    }
@ -511,7 +572,7 @@ mod tests {
        ]);
        request.cache_anchor = Some(0);

-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 2, "expected collapse to 2, got {:?}", bps);
    }
@ -525,7 +586,7 @@ mod tests {
            .user("run it")
            .item(Item::tool_call("c1", "t", "{}"))
            .item(Item::tool_result("c1", "result"));
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 1);
        let (mi, pi, _) = bps[0];
@ -549,7 +610,7 @@ mod tests {
        let request = Request::new()
            .user("hello")
            .assistant("hi there");
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        assert!(
            matches!(req.messages[0].content, AnthropicContent::Text(_)),
            "non-breakpoint single-text message should use text shorthand",
@ -563,7 +624,7 @@ mod tests {
        let scheme = AnthropicScheme::new();
        let mut request = Request::new().user("hello");
        request.cache_anchor = Some(0);
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        match &req.messages[0].content {
            AnthropicContent::Parts(parts) => {
                assert_eq!(parts.len(), 1);
@ -583,7 +644,7 @@ mod tests {
        let scheme = AnthropicScheme::new();
        let mut request = Request::new().user("hello");
        request.cache_anchor = Some(0);
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let json = serde_json::to_value(&req).unwrap();
        let part = &json["messages"][0]["content"][0];
        assert_eq!(part["type"], "text");
@ -598,7 +659,7 @@ mod tests {
        let scheme = AnthropicScheme::new();
        let mut request = Request::new().user("one");
        request.cache_anchor = Some(99);
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        // Only the Head breakpoint survives.
        let bps = breakpoint_positions(&req);
        assert_eq!(bps.len(), 1);
@ -607,11 +668,22 @@ mod tests {
    #[test]
    fn empty_items_produce_no_breakpoints() {
        let scheme = AnthropicScheme::new();
-        let req = scheme.build_request("claude-sonnet-4-20250514", &Request::new());
+        let req = scheme.build_request("claude-sonnet-4-20250514", &Request::new(), &cap_explicit());
        assert!(req.messages.is_empty());
        assert!(breakpoint_positions(&req).is_empty());
    }

+    #[test]
+    fn cache_auto_does_not_add_cache_control() {
+        // Ollama のように `CacheStrategy::Auto` のときは cache_control
+        // マーカーを一切付けない。breakpoint 計算も走らないこと。
+        let scheme = AnthropicScheme::new();
+        let mut request = Request::new().user("hello");
+        request.cache_anchor = Some(0);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_auto());
+        assert!(breakpoint_positions(&req).is_empty());
+    }
+
    #[test]
    fn tool_definitions_carry_no_cache_control() {
        // Tool JSON schema must serialise unchanged — no sneak-in of
@ -623,7 +695,7 @@ mod tests {
                "type": "object",
                "properties": {}
            })));
-        let req = scheme.build_request("claude-sonnet-4-20250514", &request);
+        let req = scheme.build_request("claude-sonnet-4-20250514", &request, &cap_explicit());
        let json = serde_json::to_value(&req).unwrap();
        let tool = &json["tools"][0];
        assert!(tool.get("cache_control").is_none());
--- a/crates/llm-worker/src/llm_client/scheme/anthropic/scheme_impl.rs
+++ b/crates/llm-worker/src/llm_client/scheme/anthropic/scheme_impl.rs
@ -0,0 +1,99 @@
+//! `impl Scheme for AnthropicScheme`
+//!
+//! Anthropic Messages API の wire 表現に必要な URL・ヘッダ・SSE パース・
+//! リクエスト body 生成を共通 `Scheme` trait にぶら下げる。
+
+use serde_json::Value;
+
+use crate::llm_client::{
+    ClientError,
+    capability::ModelCapability,
+    event::{BlockStop, BlockType, Event},
+    auth::AuthRequirement,
+    scheme::Scheme,
+    types::Request,
+};
+
+use super::AnthropicScheme;
+
+/// Anthropic の SSE パースで必要な状態。
+///
+/// `content_block_stop` イベントは `block_type` を持たない仕様なので、
+/// 直前の `content_block_start` で観測した `block_type` を保持して
+/// `BlockStop` に書き戻す。
+#[derive(Debug, Default)]
+pub struct AnthropicState {
+    current_block_type: Option<BlockType>,
+}
+
+impl Scheme for AnthropicScheme {
+    type State = AnthropicState;
+
+    fn default_base_url(&self) -> &'static str {
+        "https://api.anthropic.com"
+    }
+
+    fn path(&self, _model_id: &str) -> String {
+        "/v1/messages".to_string()
+    }
+
+    fn required_auth(&self) -> AuthRequirement {
+        // Ollama の `/v1/messages` 互換では認証が要らないが、それは
+        // `AuthRef::None` + `build_headers` 側の「ResolvedAuth::None
+        // なら何もしない」分岐で吸収する（`accepts` 判定で弾かれない
+        // よう、現状は XApiKey を要求しつつ、None 側でもパスするよう
+        // にする戦略）。
+        AuthRequirement::XApiKey
+    }
+
+    fn additional_headers(&self) -> Vec<(&'static str, String)> {
+        let mut headers = vec![("anthropic-version", self.api_version.clone())];
+        if self.fine_grained_tool_streaming {
+            headers.push((
+                "anthropic-beta",
+                "fine-grained-tool-streaming-2025-05-14".to_string(),
+            ));
+        }
+        headers
+    }
+
+    fn build_request_body(
+        &self,
+        model_id: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> Value {
+        let req = self.build_request(model_id, request, capability);
+        serde_json::to_value(&req).expect("AnthropicRequest is always serialisable")
+    }
+
+    fn parse_sse(
+        &self,
+        event_type: &str,
+        data: &str,
+        state: &mut Self::State,
+    ) -> Result<Vec<Event>, ClientError> {
+        let Some(mut event) = self.parse_event(event_type, data)? else {
+            return Ok(Vec::new());
+        };
+        match &event {
+            Event::BlockStart(start) => {
+                state.current_block_type = Some(start.block_type);
+            }
+            Event::BlockStop(stop) => {
+                if let Some(block_type) = state.current_block_type.take() {
+                    event = Event::BlockStop(BlockStop {
+                        block_type,
+                        ..stop.clone()
+                    });
+                }
+            }
+            _ => {}
+        }
+        Ok(vec![event])
+    }
+
+    fn capability_for(&self, model_id: &str) -> Option<ModelCapability> {
+        super::capability::lookup(model_id)
+    }
+}
--- a/crates/llm-worker/src/llm_client/scheme/gemini/capability.rs
+++ b/crates/llm-worker/src/llm_client/scheme/gemini/capability.rs
@ -0,0 +1,26 @@
+//! `model_id → ModelCapability` 静的テーブル（Google Gemini）。
+
+use crate::llm_client::capability::{
+    CacheStrategy, ModelCapability, ReasoningSupport, StructuredOutput, ToolCallingSupport,
+};
+
+pub(crate) fn lookup(model_id: &str) -> Option<ModelCapability> {
+    if !model_id.starts_with("gemini-") {
+        return None;
+    }
+    // 2.5 系以降は thinking / reasoning を持つ
+    let reasoning = if model_id.starts_with("gemini-2.5")
+        || model_id.starts_with("gemini-3")
+    {
+        Some(ReasoningSupport::BudgetTokens)
+    } else {
+        None
+    };
+    Some(ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning,
+        vision: true,
+        prompt_caching: CacheStrategy::Auto,
+    })
+}
--- a/crates/llm-worker/src/llm_client/scheme/gemini/mod.rs
+++ b/crates/llm-worker/src/llm_client/scheme/gemini/mod.rs
@ -3,8 +3,10 @@
 //! - リクエストJSON生成
 //! - SSEイベントパース → Event変換

+mod capability;
 mod events;
 mod request;
+mod scheme_impl;

 /// Geminiスキーマ
 ///
--- a/crates/llm-worker/src/llm_client/scheme/gemini/request.rs
+++ b/crates/llm-worker/src/llm_client/scheme/gemini/request.rs
@ -7,6 +7,7 @@ use serde_json::Value;

 use crate::llm_client::{
    Request,
+    capability::{ModelCapability, ReasoningSupport},
    types::{Item, Role, ToolDefinition, parse_tool_arguments},
 };

@ -139,11 +140,26 @@ pub(crate) struct GeminiGenerationConfig {
    /// Stop sequences
    #[serde(skip_serializing_if = "Vec::is_empty")]
    pub stop_sequences: Vec<String>,
+    /// Thinking / reasoning 設定（Gemini 2.5 以降）。
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub thinking_config: Option<GeminiThinkingConfig>,
+}
+
+/// Gemini thinking config (gemini-2.5 以降)
+#[derive(Debug, Serialize)]
+#[serde(rename_all = "camelCase")]
+pub(crate) struct GeminiThinkingConfig {
+    /// Token budget for thinking. `-1` means dynamic.
+    pub thinking_budget: i32,
 }

 impl GeminiScheme {
    /// Build Gemini request from Request
-    pub(crate) fn build_request(&self, request: &Request) -> GeminiRequest {
+    pub(crate) fn build_request(
+        &self,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> GeminiRequest {
        let contents = self.convert_items_to_contents(&request.items);

        // System prompt
@ -177,6 +193,22 @@ impl GeminiScheme {
            None
        };

+        // Reasoning の投影: capability が BudgetTokens / Both をサポートし、
+        // request 側で budget_tokens が指定されているときだけ thinking_config を付ける。
+        let supports_budget = matches!(
+            capability.reasoning,
+            Some(ReasoningSupport::BudgetTokens | ReasoningSupport::Both),
+        );
+        let thinking_config = request
+            .config
+            .reasoning
+            .as_ref()
+            .and_then(|rc| rc.budget_tokens)
+            .filter(|_| supports_budget)
+            .map(|budget| GeminiThinkingConfig {
+                thinking_budget: budget as i32,
+            });
+
        // Generation config
        let generation_config = Some(GeminiGenerationConfig {
            max_output_tokens: request.config.max_tokens,
@ -184,6 +216,7 @@ impl GeminiScheme {
            top_p: request.config.top_p,
            top_k: request.config.top_k,
            stop_sequences: request.config.stop_sequences.clone(),
+            thinking_config,
        });

        GeminiRequest {
@ -341,6 +374,17 @@ impl GeminiScheme {
 #[cfg(test)]
 mod tests {
    use super::*;
+    use crate::llm_client::capability::{CacheStrategy, StructuredOutput, ToolCallingSupport};
+
+    fn cap() -> ModelCapability {
+        ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: true,
+            prompt_caching: CacheStrategy::Auto,
+        }
+    }

    #[test]
    fn test_build_simple_request() {
@ -349,7 +393,7 @@ mod tests {
            .system("You are a helpful assistant.")
            .user("Hello!");

-        let gemini_req = scheme.build_request(&request);
+        let gemini_req = scheme.build_request(&request, &cap());

        assert!(gemini_req.system_instruction.is_some());
        assert_eq!(gemini_req.contents.len(), 1);
@ -371,7 +415,7 @@ mod tests {
                })),
        );

-        let gemini_req = scheme.build_request(&request);
+        let gemini_req = scheme.build_request(&request, &cap());

        assert_eq!(gemini_req.tools.len(), 1);
        assert_eq!(gemini_req.tools[0].function_declarations.len(), 1);
@ -387,7 +431,7 @@ mod tests {
        let scheme = GeminiScheme::new();
        let request = Request::new().user("Hello").assistant("Hi there!");

-        let gemini_req = scheme.build_request(&request);
+        let gemini_req = scheme.build_request(&request, &cap());

        assert_eq!(gemini_req.contents.len(), 2);
        assert_eq!(gemini_req.contents[0].role, "user");
@ -406,7 +450,7 @@ mod tests {
            ))
            .item(Item::tool_result("call_123", "Sunny, 25°C"));

-        let gemini_req = scheme.build_request(&request);
+        let gemini_req = scheme.build_request(&request, &cap());

        assert_eq!(gemini_req.contents.len(), 3);
        assert_eq!(gemini_req.contents[0].role, "user");
--- a/crates/llm-worker/src/llm_client/scheme/gemini/scheme_impl.rs
+++ b/crates/llm-worker/src/llm_client/scheme/gemini/scheme_impl.rs
@ -0,0 +1,53 @@
+//! `impl Scheme for GeminiScheme`
+
+use serde_json::Value;
+
+use crate::llm_client::{
+    ClientError,
+    capability::ModelCapability,
+    event::Event,
+    auth::AuthRequirement,
+    scheme::Scheme,
+    types::Request,
+};
+
+use super::GeminiScheme;
+
+impl Scheme for GeminiScheme {
+    type State = ();
+
+    fn default_base_url(&self) -> &'static str {
+        "https://generativelanguage.googleapis.com"
+    }
+
+    fn path(&self, model_id: &str) -> String {
+        format!("/v1beta/models/{model_id}:streamGenerateContent?alt=sse")
+    }
+
+    fn required_auth(&self) -> AuthRequirement {
+        AuthRequirement::QueryParam { name: "key" }
+    }
+
+    fn build_request_body(
+        &self,
+        _model_id: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> Value {
+        let req = self.build_request(request, capability);
+        serde_json::to_value(&req).expect("GeminiRequest is always serialisable")
+    }
+
+    fn parse_sse(
+        &self,
+        _event_type: &str,
+        data: &str,
+        _state: &mut Self::State,
+    ) -> Result<Vec<Event>, ClientError> {
+        Ok(self.parse_event(data)?.unwrap_or_default())
+    }
+
+    fn capability_for(&self, model_id: &str) -> Option<ModelCapability> {
+        super::capability::lookup(model_id)
+    }
+}
--- a/crates/llm-worker/src/llm_client/scheme/mod.rs
+++ b/crates/llm-worker/src/llm_client/scheme/mod.rs
@ -3,7 +3,80 @@
 //! 各APIスキーマごとの変換ロジック
 //! - リクエスト変換: Request → プロバイダ固有JSON
 //! - レスポンス変換: SSEイベント → Event
+//!
+//! [`Scheme`] trait により `HttpTransport<S>` から scheme 固有の差分
+//! （パス、ヘッダ、認証要件、body 生成、SSE パース）をすべて委譲する。

 pub mod anthropic;
 pub mod gemini;
-pub mod openai;
+pub mod openai_chat;
+
+use serde_json::Value;
+
+use super::auth::AuthRequirement;
+use super::capability::ModelCapability;
+use super::error::ClientError;
+use super::event::Event;
+use super::types::Request;
+
+/// wire scheme の抽象。各プロバイダの API 仕様ごとに 1 つ実装する。
+///
+/// `HttpTransport<S: Scheme>` が URL 組立・認証ヘッダ挿入・SSE パース
+/// のループを担い、`Scheme` 実装は各仕様固有の差分のみ提供する。
+///
+/// # 状態
+///
+/// SSE パースでフレーム間に状態を保つ必要がある scheme（Anthropic の
+/// `BlockStop` に `block_type` が載らない仕様の補完など）は
+/// [`Scheme::State`] に中間状態を表す型を置く。
+/// 状態を持たない scheme は `type State = ()` とする。
+pub trait Scheme: Clone + Send + Sync + 'static {
+    /// SSE パースのフレーム間で共有する状態。`HttpTransport` が
+    /// ストリーム開始時に `Default::default()` を一度だけ作り、
+    /// フレームごとに `&mut` で渡す。
+    type State: Default + Send + 'static;
+
+    /// scheme のベース URL（`ModelConfig::base_url` 未指定時のデフォルト）
+    fn default_base_url(&self) -> &'static str;
+
+    /// リクエスト先の相対パス。Gemini のようにモデル名をパスに埋め込む
+    /// プロバイダもあるため、モデル ID を受け取る。
+    fn path(&self, model_id: &str) -> String;
+
+    /// この scheme が要求する認証形式。`build_client` 時に
+    /// [`AuthRef`](../../../manifest/enum.AuthRef.html) と照合する。
+    fn required_auth(&self) -> AuthRequirement;
+
+    /// `Content-Type` 以外の追加ヘッダ。`anthropic-version` / `anthropic-beta` 等。
+    fn additional_headers(&self) -> Vec<(&'static str, String)> {
+        Vec::new()
+    }
+
+    /// リクエスト body を生成する。`capability` は `CacheStrategy` や
+    /// `ReasoningSupport` を参照して scheme 側の挙動を分岐させるため
+    /// に渡される。
+    fn build_request_body(
+        &self,
+        model_id: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> Value;
+
+    /// SSE イベント 1 件を 0 個以上の [`Event`] に変換する。
+    ///
+    /// `event_type` は SSE フレームの `event:` フィールド、`data` は
+    /// `data:` フィールド。`[DONE]` 等の終端マーカーは実装側で判定する。
+    /// `state` はストリーム単位で共有される可変状態。
+    fn parse_sse(
+        &self,
+        event_type: &str,
+        data: &str,
+        state: &mut Self::State,
+    ) -> Result<Vec<Event>, ClientError>;
+
+    /// 既知モデル ID の能力テーブル引き。未知なら `None` を返す
+    /// ので、呼び出し側は scheme ごとの安全側デフォルト
+    /// （[`ModelCapability::minimal`]）にフォールバックする。
+    fn capability_for(&self, model_id: &str) -> Option<ModelCapability>;
+}
+
--- a/crates/llm-worker/src/llm_client/scheme/openai_chat/capability.rs
+++ b/crates/llm-worker/src/llm_client/scheme/openai_chat/capability.rs
@ -0,0 +1,47 @@
+//! `model_id → ModelCapability` 静的テーブル（OpenAI Chat Completions）。
+//!
+//! OpenAI 本家の主要モデルのみ網羅する。OpenRouter / xAI / Groq 等は
+//! モデル ID が各社独自なので、マニフェスト側で明示 override する
+//! 前提。
+
+use crate::llm_client::capability::{
+    CacheStrategy, ModelCapability, ReasoningSupport, StructuredOutput, ToolCallingSupport,
+};
+
+pub(crate) fn lookup(model_id: &str) -> Option<ModelCapability> {
+    // GPT-5 / o1 / o3 / o4 reasoning 系
+    if model_id.starts_with("gpt-5")
+        || model_id.starts_with("o1")
+        || model_id.starts_with("o3")
+        || model_id.starts_with("o4")
+    {
+        return Some(ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: Some(ReasoningSupport::Effort),
+            vision: true,
+            prompt_caching: CacheStrategy::Auto,
+        });
+    }
+    // GPT-4o / GPT-4 系
+    if model_id.starts_with("gpt-4") {
+        return Some(ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: true,
+            prompt_caching: CacheStrategy::Auto,
+        });
+    }
+    // GPT-3.5 系（旧式・structured output 限定）
+    if model_id.starts_with("gpt-3.5") {
+        return Some(ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonObject,
+            reasoning: None,
+            vision: false,
+            prompt_caching: CacheStrategy::Auto,
+        });
+    }
+    None
+}
--- a/crates/llm-worker/src/llm_client/scheme/openai_chat/events.rs
+++ b/crates/llm-worker/src/llm_client/scheme/openai_chat/events.rs
--- a/crates/llm-worker/src/llm_client/scheme/openai_chat/mod.rs
+++ b/crates/llm-worker/src/llm_client/scheme/openai_chat/mod.rs
@ -3,8 +3,10 @@
 //! - リクエストJSON生成
 //! - SSEイベントパース → Event変換

+mod capability;
 mod events;
 mod request;
+mod scheme_impl;

 /// OpenAIスキーマ
 ///
--- a/crates/llm-worker/src/llm_client/scheme/openai_chat/request.rs
+++ b/crates/llm-worker/src/llm_client/scheme/openai_chat/request.rs
@ -7,6 +7,7 @@ use serde_json::Value;

 use crate::llm_client::{
    Request,
+    capability::{ModelCapability, ReasoningEffort, ReasoningSupport},
    types::{Item, Role, ToolDefinition, parse_tool_arguments},
 };

@ -34,6 +35,9 @@ pub(crate) struct OpenAIRequest {
    pub tools: Vec<OpenAITool>,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub tool_choice: Option<String>,
+    /// Reasoning effort（o1 / o3 / o4 / gpt-5 系で有効）。
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub reasoning_effort: Option<&'static str>,
 }

 #[derive(Debug, Serialize)]
@ -110,7 +114,12 @@ pub(crate) struct OpenAIToolCallFunction {

 impl OpenAIScheme {
    /// Build OpenAI request from Request
-    pub(crate) fn build_request(&self, model: &str, request: &Request) -> OpenAIRequest {
+    pub(crate) fn build_request(
+        &self,
+        model: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> OpenAIRequest {
        let mut messages = Vec::new();

        // Add system message if present
@ -135,6 +144,24 @@ impl OpenAIScheme {
            (None, request.config.max_tokens)
        };

+        // Reasoning の投影: capability が Effort / Both をサポートし、
+        // request 側で effort が指定されているときだけ reasoning_effort を付ける。
+        let supports_effort = matches!(
+            capability.reasoning,
+            Some(ReasoningSupport::Effort | ReasoningSupport::Both),
+        );
+        let reasoning_effort = request
+            .config
+            .reasoning
+            .as_ref()
+            .and_then(|rc| rc.effort)
+            .filter(|_| supports_effort)
+            .map(|effort| match effort {
+                ReasoningEffort::Low => "low",
+                ReasoningEffort::Medium => "medium",
+                ReasoningEffort::High => "high",
+            });
+
        OpenAIRequest {
            model: model.to_string(),
            max_completion_tokens,
@ -149,6 +176,7 @@ impl OpenAIScheme {
            messages,
            tools,
            tool_choice: None,
+            reasoning_effort,
        }
    }

@ -294,13 +322,24 @@ impl OpenAIScheme {
 #[cfg(test)]
 mod tests {
    use super::*;
+    use crate::llm_client::capability::{CacheStrategy, StructuredOutput, ToolCallingSupport};
+
+    fn cap() -> ModelCapability {
+        ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: false,
+            prompt_caching: CacheStrategy::Auto,
+        }
+    }

    #[test]
    fn test_build_simple_request() {
        let scheme = OpenAIScheme::new();
        let request = Request::new().system("System prompt").user("Hello");

-        let body = scheme.build_request("gpt-4o", &request);
+        let body = scheme.build_request("gpt-4o", &request, &cap());

        assert_eq!(body.model, "gpt-4o");
        assert_eq!(body.messages.len(), 2);
@ -321,7 +360,7 @@ mod tests {
            .user("Check weather")
            .tool(ToolDefinition::new("weather").description("Get weather"));

-        let body = scheme.build_request("gpt-4o", &request);
+        let body = scheme.build_request("gpt-4o", &request, &cap());
        assert_eq!(body.tools.len(), 1);
        assert_eq!(body.tools[0].function.name, "weather");
    }
@ -331,7 +370,7 @@ mod tests {
        let scheme = OpenAIScheme::new().with_legacy_max_tokens(true);
        let request = Request::new().user("Hello").max_tokens(100);

-        let body = scheme.build_request("llama3", &request);
+        let body = scheme.build_request("llama3", &request, &cap());

        assert_eq!(body.max_tokens, Some(100));
        assert!(body.max_completion_tokens.is_none());
@ -342,7 +381,7 @@ mod tests {
        let scheme = OpenAIScheme::new();
        let request = Request::new().user("Hello").max_tokens(100);

-        let body = scheme.build_request("gpt-4o", &request);
+        let body = scheme.build_request("gpt-4o", &request, &cap());

        assert_eq!(body.max_completion_tokens, Some(100));
        assert!(body.max_tokens.is_none());
@ -360,7 +399,7 @@ mod tests {
            ))
            .item(Item::tool_result("call_123", "Sunny, 25°C"));

-        let body = scheme.build_request("gpt-4o", &request);
+        let body = scheme.build_request("gpt-4o", &request, &cap());

        assert_eq!(body.messages.len(), 3);
        assert_eq!(body.messages[0].role, "user");
--- a/crates/llm-worker/src/llm_client/scheme/openai_chat/scheme_impl.rs
+++ b/crates/llm-worker/src/llm_client/scheme/openai_chat/scheme_impl.rs
@ -0,0 +1,57 @@
+//! `impl Scheme for OpenAIScheme`
+
+use serde_json::Value;
+
+use crate::llm_client::{
+    ClientError,
+    capability::ModelCapability,
+    event::Event,
+    auth::AuthRequirement,
+    scheme::Scheme,
+    types::Request,
+};
+
+use super::OpenAIScheme;
+
+impl Scheme for OpenAIScheme {
+    type State = ();
+
+    fn default_base_url(&self) -> &'static str {
+        "https://api.openai.com"
+    }
+
+    fn path(&self, _model_id: &str) -> String {
+        "/v1/chat/completions".to_string()
+    }
+
+    fn required_auth(&self) -> AuthRequirement {
+        AuthRequirement::Bearer
+    }
+
+    fn build_request_body(
+        &self,
+        model_id: &str,
+        request: &Request,
+        capability: &ModelCapability,
+    ) -> Value {
+        let req = self.build_request(model_id, request, capability);
+        serde_json::to_value(&req).expect("OpenAIRequest is always serialisable")
+    }
+
+    fn parse_sse(
+        &self,
+        _event_type: &str,
+        data: &str,
+        _state: &mut Self::State,
+    ) -> Result<Vec<Event>, ClientError> {
+        // `data: [DONE]` は終端マーカー
+        if data.trim() == "[DONE]" {
+            return Ok(Vec::new());
+        }
+        Ok(self.parse_event(data)?.unwrap_or_default())
+    }
+
+    fn capability_for(&self, model_id: &str) -> Option<ModelCapability> {
+        super::capability::lookup(model_id)
+    }
+}
--- a/crates/llm-worker/src/llm_client/transport.rs
+++ b/crates/llm-worker/src/llm_client/transport.rs
@ -0,0 +1,226 @@
+//! `HttpTransport<S: Scheme>`: すべての LLM wire scheme を共通の 1 本の
+//! HTTP クライアントで扱う。
+//!
+//! 旧 `providers/{anthropic,openai,gemini,ollama}.rs` を置き換える。
+//! scheme 固有の差分は [`Scheme`] trait 実装に委譲する。
+
+use std::pin::Pin;
+
+use async_trait::async_trait;
+use eventsource_stream::Eventsource;
+use futures::{Stream, StreamExt, TryStreamExt};
+use reqwest::header::{CONTENT_TYPE, HeaderMap, HeaderValue};
+
+use super::capability::ModelCapability;
+use super::client::LlmClient;
+use super::error::ClientError;
+use super::event::Event;
+use super::auth::AuthRequirement;
+use super::scheme::Scheme;
+use super::types::Request;
+
+/// `AuthRef` を解決したランタイム表現。`crates/provider` が構築する。
+///
+/// `AuthRef::ApiKey` → 読み取った文字列、`AuthRef::None` → `None`。
+/// `CodexOAuth` 等、動的に更新される認証は別途 `Custom` バリアントを
+/// 追加する余地を残す（本チケットでは未実装）。
+#[derive(Debug, Clone)]
+pub enum ResolvedAuth {
+    None,
+    ApiKey(String),
+}
+
+impl ResolvedAuth {
+    /// 認証要件と実際の解決値が噛み合うか検査する。構築時検証用。
+    ///
+    /// `ResolvedAuth::None` は認証を付けないという宣言なので、どの
+    /// `AuthRequirement` でも受け入れる（Ollama の Anthropic scheme
+    /// 流用は `required_auth = XApiKey` だが認証ヘッダなしで動く）。
+    pub fn matches(&self, req: AuthRequirement) -> bool {
+        match (self, req) {
+            (Self::None, _) => true,
+            (
+                Self::ApiKey(_),
+                AuthRequirement::Bearer | AuthRequirement::XApiKey | AuthRequirement::QueryParam { .. },
+            ) => true,
+            _ => false,
+        }
+    }
+}
+
+/// scheme 共通の HTTP 通信層。
+pub struct HttpTransport<S: Scheme> {
+    http_client: reqwest::Client,
+    scheme: S,
+    model_id: String,
+    base_url: String,
+    auth: ResolvedAuth,
+    capability: ModelCapability,
+}
+
+impl<S: Scheme> HttpTransport<S> {
+    /// 新しい transport を作る。`base_url` は末尾スラッシュの有無を
+    /// どちらでも受け付ける（内部で正規化）。
+    pub fn new(
+        scheme: S,
+        model_id: impl Into<String>,
+        base_url: impl Into<String>,
+        auth: ResolvedAuth,
+        capability: ModelCapability,
+    ) -> Self {
+        let base_url = base_url.into();
+        let base_url = base_url.trim_end_matches('/').to_string();
+        Self {
+            http_client: reqwest::Client::new(),
+            scheme,
+            model_id: model_id.into(),
+            base_url,
+            auth,
+            capability,
+        }
+    }
+
+    /// カスタム HTTP クライアントを差し込む（テスト等）。
+    pub fn with_http_client(mut self, client: reqwest::Client) -> Self {
+        self.http_client = client;
+        self
+    }
+
+    fn build_url(&self) -> String {
+        let path = self.scheme.path(&self.model_id);
+        let url = format!("{}{}", self.base_url, path);
+        // Gemini のようにクエリパラメータで認証する場合は URL にキーを追記する
+        if let (AuthRequirement::QueryParam { name }, ResolvedAuth::ApiKey(key)) =
+            (self.scheme.required_auth(), &self.auth)
+        {
+            let sep = if url.contains('?') { '&' } else { '?' };
+            format!("{url}{sep}{name}={key}")
+        } else {
+            url
+        }
+    }
+
+    fn build_headers(&self) -> Result<HeaderMap, ClientError> {
+        let mut headers = HeaderMap::new();
+        headers.insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
+
+        match (self.scheme.required_auth(), &self.auth) {
+            (AuthRequirement::None, _) | (_, ResolvedAuth::None) => {}
+            (AuthRequirement::Bearer, ResolvedAuth::ApiKey(key)) => {
+                let mut val = HeaderValue::from_str(&format!("Bearer {key}"))
+                    .map_err(|e| ClientError::Config(format!("invalid api key: {e}")))?;
+                val.set_sensitive(true);
+                headers.insert("Authorization", val);
+            }
+            (AuthRequirement::XApiKey, ResolvedAuth::ApiKey(key)) => {
+                let mut val = HeaderValue::from_str(key.as_str())
+                    .map_err(|e| ClientError::Config(format!("invalid api key: {e}")))?;
+                val.set_sensitive(true);
+                headers.insert("x-api-key", val);
+            }
+            (AuthRequirement::QueryParam { .. }, _) => {
+                // クエリパラメータは `build_url` で付与済み
+            }
+            (AuthRequirement::Custom, _) => {
+                // 今チケットでは Custom は使わない。Codex OAuth で追加予定
+            }
+        }
+
+        for (name, value) in self.scheme.additional_headers() {
+            let hv = HeaderValue::from_str(&value)
+                .map_err(|e| ClientError::Config(format!("invalid header {name}: {e}")))?;
+            headers.insert(name, hv);
+        }
+
+        Ok(headers)
+    }
+}
+
+impl<S: Scheme + Clone> Clone for HttpTransport<S> {
+    fn clone(&self) -> Self {
+        Self {
+            http_client: self.http_client.clone(),
+            scheme: self.scheme.clone(),
+            model_id: self.model_id.clone(),
+            base_url: self.base_url.clone(),
+            auth: self.auth.clone(),
+            capability: self.capability.clone(),
+        }
+    }
+}
+
+#[async_trait]
+impl<S: Scheme + Clone + 'static> LlmClient for HttpTransport<S> {
+    fn clone_boxed(&self) -> Box<dyn LlmClient> {
+        Box::new(self.clone())
+    }
+
+    async fn stream(
+        &self,
+        request: Request,
+    ) -> Result<Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>>, ClientError> {
+        let url = self.build_url();
+        let headers = self.build_headers()?;
+        let body = self
+            .scheme
+            .build_request_body(&self.model_id, &request, &self.capability);
+
+        let response = self
+            .http_client
+            .post(&url)
+            .headers(headers)
+            .json(&body)
+            .send()
+            .await?;
+
+        if !response.status().is_success() {
+            let status = response.status().as_u16();
+            let text = response.text().await.unwrap_or_default();
+            if let Ok(json) = serde_json::from_str::<serde_json::Value>(&text) {
+                let error = json.get("error").unwrap_or(&json);
+                let code = error.get("type").and_then(|v| v.as_str()).map(String::from);
+                let message = error
+                    .get("message")
+                    .and_then(|v| v.as_str())
+                    .unwrap_or(&text)
+                    .to_string();
+                return Err(ClientError::Api {
+                    status: Some(status),
+                    code,
+                    message,
+                });
+            }
+            return Err(ClientError::Api {
+                status: Some(status),
+                code: None,
+                message: text,
+            });
+        }
+
+        let scheme = self.scheme.clone();
+        let byte_stream = response.bytes_stream().map_err(std::io::Error::other);
+        let event_stream = byte_stream.eventsource();
+
+        // scheme 固有のパース状態をストリーム単位で保持する
+        let mut state = <S::State as Default>::default();
+
+        let stream = event_stream
+            .map(move |result| match result {
+                Ok(frame) => match scheme.parse_sse(&frame.event, &frame.data, &mut state) {
+                    Ok(events) => Ok(events),
+                    Err(e) => Err(e),
+                },
+                Err(e) => Err(ClientError::Sse(e.to_string())),
+            })
+            .map(|res| {
+                let s: Pin<Box<dyn Stream<Item = Result<Event, ClientError>> + Send>> = match res {
+                    Ok(events) => Box::pin(futures::stream::iter(events.into_iter().map(Ok))),
+                    Err(e) => Box::pin(futures::stream::once(async move { Err(e) })),
+                };
+                s
+            })
+            .flatten();
+
+        Ok(Box::pin(stream))
+    }
+}
--- a/crates/llm-worker/src/llm_client/types.rs
+++ b/crates/llm-worker/src/llm_client/types.rs
@ -565,6 +565,12 @@ pub struct RequestConfig {
    pub top_k: Option<u32>,
    /// Stop sequences
    pub stop_sequences: Vec<String>,
+    /// Reasoning / extended-thinking 制御（共通型、scheme 側で各社形式に投影）。
+    ///
+    /// `None` のときは何も送らない。`Some` でも scheme の
+    /// `ModelCapability::reasoning` が `None` なら無視される。
+    #[serde(default)]
+    pub reasoning: Option<crate::llm_client::capability::ReasoningControl>,
 }

 impl RequestConfig {
--- a/crates/llm-worker/tests/ui/locked_register_tool.rs
+++ b/crates/llm-worker/tests/ui/locked_register_tool.rs
@ -1,9 +1,26 @@
 use llm_worker::Worker;
-use llm_worker::llm_client::providers::ollama::OllamaClient;
+use llm_worker::llm_client::capability::{
+    CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport,
+};
+use llm_worker::llm_client::scheme::anthropic::AnthropicScheme;
+use llm_worker::llm_client::transport::{HttpTransport, ResolvedAuth};
 use std::sync::Arc;

 fn main() {
-    let client = OllamaClient::new("dummy-model");
+    let cap = ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: None,
+        vision: false,
+        prompt_caching: CacheStrategy::Auto,
+    };
+    let client = HttpTransport::new(
+        AnthropicScheme::new(),
+        "dummy-model".to_string(),
+        "http://localhost:11434".to_string(),
+        ResolvedAuth::None,
+        cap,
+    );
    let worker = Worker::new(client);
    let mut locked = worker.lock();
    let def: llm_worker::tool::ToolDefinition = Arc::new(|| panic!("unused"));
--- a/crates/llm-worker/tests/ui/locked_register_tool.stderr
+++ b/crates/llm-worker/tests/ui/locked_register_tool.stderr
@ -1,8 +1,8 @@
-error[E0599]: no method named `register_tool` found for struct `Worker<OllamaClient, Locked>` in the current scope
-  --> tests/ui/locked_register_tool.rs:10:20
+error[E0599]: no method named `register_tool` found for struct `Worker<HttpTransport<AnthropicScheme>, Locked>` in the current scope
+  --> tests/ui/locked_register_tool.rs:27:20
   |
-10 |     let _ = locked.register_tool(def);
-   |                    ^^^^^^^^^^^^^ method not found in `Worker<OllamaClient, Locked>`
+27 |     let _ = locked.register_tool(def);
+   |                    ^^^^^^^^^^^^^ method not found in `Worker<HttpTransport<AnthropicScheme>, Locked>`
   |
   = note: the method was found for
           - `Worker<C>`
--- a/crates/llm-worker/tests/ui/tool_server_handle_register_tool.rs
+++ b/crates/llm-worker/tests/ui/tool_server_handle_register_tool.rs
@ -1,9 +1,26 @@
 use llm_worker::Worker;
-use llm_worker::llm_client::providers::ollama::OllamaClient;
+use llm_worker::llm_client::capability::{
+    CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport,
+};
+use llm_worker::llm_client::scheme::anthropic::AnthropicScheme;
+use llm_worker::llm_client::transport::{HttpTransport, ResolvedAuth};
 use std::sync::Arc;

 fn main() {
-    let client = OllamaClient::new("dummy-model");
+    let cap = ModelCapability {
+        tool_calling: ToolCallingSupport::Parallel,
+        structured_output: StructuredOutput::JsonSchema,
+        reasoning: None,
+        vision: false,
+        prompt_caching: CacheStrategy::Auto,
+    };
+    let client = HttpTransport::new(
+        AnthropicScheme::new(),
+        "dummy-model".to_string(),
+        "http://localhost:11434".to_string(),
+        ResolvedAuth::None,
+        cap,
+    );
    let worker = Worker::new(client);
    let handle = worker.tool_server_handle();
    let def: llm_worker::tool::ToolDefinition = Arc::new(|| panic!("unused"));
--- a/crates/llm-worker/tests/ui/tool_server_handle_register_tool.stderr
+++ b/crates/llm-worker/tests/ui/tool_server_handle_register_tool.stderr
@ -1,7 +1,7 @@
 error[E0624]: method `register_tool` is private
-  --> tests/ui/tool_server_handle_register_tool.rs:10:20
+  --> tests/ui/tool_server_handle_register_tool.rs:27:20
   |
-10 |     let _ = handle.register_tool(def);
+27 |     let _ = handle.register_tool(def);
   |                    ^^^^^^^^^^^^^ private method
   |
  ::: src/tool_server.rs
--- a/crates/llm-worker/tests/validation_test.rs
+++ b/crates/llm-worker/tests/validation_test.rs
@ -1,39 +0,0 @@
-use llm_worker::llm_client::providers::openai::OpenAIClient;
-use llm_worker::{Worker, WorkerError};
-
-#[test]
-fn test_openai_top_k_warning() {
-    // Create client with dummy key (validate_config doesn't make network calls, so safe)
-    let client = OpenAIClient::new("dummy-key", "gpt-4o");
-
-    // Create Worker with top_k set (OpenAI doesn't support top_k)
-    let worker = Worker::new(client).top_k(50);
-
-    // Run validate()
-    let result = worker.validate();
-
-    // Verify error is returned and ConfigWarnings is included
-    match result {
-        Err(WorkerError::ConfigWarnings(warnings)) => {
-            assert_eq!(warnings.len(), 1);
-            assert_eq!(warnings[0].option_name, "top_k");
-            println!("Got expected warning: {}", warnings[0]);
-        }
-        Ok(_) => panic!("Should have returned validation error"),
-        Err(e) => panic!("Unexpected error type: {:?}", e),
-    }
-}
-
-#[test]
-fn test_openai_valid_config() {
-    let client = OpenAIClient::new("dummy-key", "gpt-4o");
-
-    // Valid configuration (temperature only)
-    let worker = Worker::new(client).temperature(0.7);
-
-    // Run validate()
-    let result = worker.validate();
-
-    // Verify success
-    assert!(result.is_ok());
-}
--- a/crates/manifest/README.md
+++ b/crates/manifest/README.md
@ -1,13 +1,14 @@
 # manifest

-Pod の宣言的設定を TOML マニフェストとして定義・パースするクレート。プロバイダ設定、ワーカー設定、ディレクトリスコープ制約を記述できる。
+Pod の宣言的設定を TOML マニフェストとして定義・パースするクレート。モデル設定、ワーカー設定、ディレクトリスコープ制約を記述できる。

 ## 公開型

 - `PodManifest` — Pod 設定全体（`from_toml()` でパース）
 - `PodMeta` — Pod メタデータ（名前、pwd）
- `ProviderConfig` — LLM プロバイダ設定（種別、モデル、APIキー環境変数、ベースURL）
- `ProviderKind` — プロバイダ種別（`Anthropic`, `Openai`, `Gemini`, `Ollama`）
+- `ModelConfig` — LLM モデル設定（scheme、base_url、model_id、auth）
+- `SchemeKind` — wire scheme 種別（`Anthropic`, `OpenaiChat`, `OpenaiResponses`, `Gemini`）
+- `AuthRef` — 認証参照（`None`, `ApiKey { env, file }`, `CodexOAuth`）
 - `WorkerManifest` — ワーカー設定（システムプロンプト、max_tokens、temperature）
 - `ScopeConfig` / `ScopeRule` / `Permission` — allow / deny の宣言的スコープ設定
 - `Scope` — 実行時スコープ。`from_config(&ScopeConfig, pwd)` で構築し、`is_readable` / `is_writable` / `permission_at` で問い合わせる
--- a/crates/manifest/src/config.rs
+++ b/crates/manifest/src/config.rs
@ -13,10 +13,8 @@ use std::path::{Path, PathBuf};
 use serde::{Deserialize, Serialize};

 use crate::defaults;
-use crate::{
-    CompactionConfig, PodManifest, PodMeta, ProviderConfig, ProviderKind, ScopeConfig,
-    ToolOutputLimits, WorkerManifest,
-};
+use crate::model::{AuthRef, ModelConfig, SchemeKind};
+use crate::{CompactionConfig, PodManifest, PodMeta, ScopeConfig, ToolOutputLimits, WorkerManifest};

 /// Partial-form Pod manifest. Every field is optional; one or more
 /// instances merge via [`PodManifestConfig::merge`] before being
@ -26,7 +24,7 @@ pub struct PodManifestConfig {
    #[serde(default)]
    pub pod: PodMetaConfig,
    #[serde(default)]
-    pub provider: ProviderConfigPartial,
+    pub model: ModelConfigPartial,
    #[serde(default)]
    pub worker: WorkerManifestConfig,
    #[serde(default)]
@ -41,16 +39,17 @@ pub struct PodMetaConfig {
    pub name: Option<String>,
 }

+/// Partial-form of [`ModelConfig`]. カスケード層で個別に与えられる。
 #[derive(Debug, Clone, Default, Serialize, Deserialize)]
-pub struct ProviderConfigPartial {
+pub struct ModelConfigPartial {
    #[serde(default)]
-    pub kind: Option<ProviderKind>,
-    #[serde(default)]
-    pub model: Option<String>,
-    #[serde(default)]
-    pub api_key_file: Option<PathBuf>,
+    pub scheme: Option<SchemeKind>,
    #[serde(default)]
    pub base_url: Option<String>,
+    #[serde(default)]
+    pub model_id: Option<String>,
+    #[serde(default)]
+    pub auth: Option<AuthRef>,
 }

 #[derive(Debug, Clone, Default, Serialize, Deserialize)]
@ -92,7 +91,7 @@ pub struct CompactionConfigPartial {
    #[serde(default)]
    pub compact_worker_max_input_tokens: Option<u64>,
    #[serde(default)]
-    pub provider: Option<ProviderConfigPartial>,
+    pub model: Option<ModelConfigPartial>,
 }

 /// Errors raised when converting a [`PodManifestConfig`] to a validated
@ -148,18 +147,16 @@ impl PodManifestConfig {
    /// rules from different layers do not accidentally inherit another
    /// layer's base.
    ///
-    /// Affected fields: `provider.api_key_file`,
+    /// Affected fields: `model.auth.file`,
    /// `scope.allow[].target`, `scope.deny[].target`,
-    /// `compaction.provider.api_key_file`.
+    /// `compaction.model.auth.file`.
    pub fn resolve_paths(mut self, base: &Path) -> Self {
        debug_assert!(
            base.is_absolute(),
            "resolve_paths base must be absolute: {}",
            base.display()
        );
-        if let Some(ref mut p) = self.provider.api_key_file {
-            *p = join_if_relative(base, p);
-        }
+        resolve_auth_file(&mut self.model.auth, base);
        for rule in &mut self.scope.allow {
            rule.target = join_if_relative(base, &rule.target);
        }
@ -167,10 +164,9 @@ impl PodManifestConfig {
            rule.target = join_if_relative(base, &rule.target);
        }
        if let Some(ref mut compaction) = self.compaction
-            && let Some(ref mut cp) = compaction.provider
-            && let Some(ref mut p) = cp.api_key_file
+            && let Some(ref mut cp) = compaction.model
        {
-            *p = join_if_relative(base, p);
+            resolve_auth_file(&mut cp.auth, base);
        }
        self
    }
@ -182,7 +178,7 @@ impl PodManifestConfig {
    pub fn merge(self, upper: PodManifestConfig) -> Self {
        Self {
            pod: self.pod.merge(upper.pod),
-            provider: self.provider.merge(upper.provider),
+            model: self.model.merge(upper.model),
            worker: self.worker.merge(upper.worker),
            scope: merge_scope(self.scope, upper.scope),
            compaction: merge_option(
@ -202,13 +198,13 @@ impl PodMetaConfig {
    }
 }

-impl ProviderConfigPartial {
+impl ModelConfigPartial {
    fn merge(self, upper: Self) -> Self {
        Self {
-            kind: upper.kind.or(self.kind),
-            model: upper.model.or(self.model),
-            api_key_file: upper.api_key_file.or(self.api_key_file),
+            scheme: upper.scheme.or(self.scheme),
            base_url: upper.base_url.or(self.base_url),
+            model_id: upper.model_id.or(self.model_id),
+            auth: upper.auth.or(self.auth),
        }
    }
 }
@ -254,7 +250,7 @@ impl CompactionConfigPartial {
            compact_worker_max_input_tokens: upper
                .compact_worker_max_input_tokens
                .or(self.compact_worker_max_input_tokens),
-            provider: merge_option(self.provider, upper.provider, ProviderConfigPartial::merge),
+            model: merge_option(self.model, upper.model, ModelConfigPartial::merge),
        }
    }
 }
@ -295,25 +291,35 @@ fn ensure_absolute(field: &'static str, path: &Path) -> Result<(), ResolveError>
    }
 }

-fn resolve_provider(
-    cfg: ProviderConfigPartial,
-    kind_field: &'static str,
-    model_field: &'static str,
-    api_key_field: &'static str,
-) -> Result<ProviderConfig, ResolveError> {
-    let kind = cfg.kind.ok_or(ResolveError::MissingField(kind_field))?;
-    let model = cfg.model.ok_or(ResolveError::MissingField(model_field))?;
-    if let Some(ref p) = cfg.api_key_file {
-        ensure_absolute(api_key_field, p)?;
+fn resolve_model(
+    cfg: ModelConfigPartial,
+    scheme_field: &'static str,
+    model_id_field: &'static str,
+    auth_file_field: &'static str,
+) -> Result<ModelConfig, ResolveError> {
+    let scheme = cfg.scheme.ok_or(ResolveError::MissingField(scheme_field))?;
+    let model_id = cfg
+        .model_id
+        .ok_or(ResolveError::MissingField(model_id_field))?;
+    let auth = cfg.auth.unwrap_or_default();
+    if let AuthRef::ApiKey { file: Some(p), .. } = &auth {
+        ensure_absolute(auth_file_field, p)?;
    }
-    Ok(ProviderConfig {
-        kind,
-        model,
-        api_key_file: cfg.api_key_file,
+    Ok(ModelConfig {
+        scheme,
        base_url: cfg.base_url,
+        model_id,
+        auth,
    })
 }

+/// `AuthRef::ApiKey { file, .. }` が相対パスのとき `base` を前置する。
+fn resolve_auth_file(auth: &mut Option<AuthRef>, base: &Path) {
+    if let Some(AuthRef::ApiKey { file: Some(p), .. }) = auth.as_mut() {
+        *p = join_if_relative(base, p);
+    }
+}
+
 impl TryFrom<PodManifestConfig> for PodManifest {
    type Error = ResolveError;

@ -323,11 +329,11 @@ impl TryFrom<PodManifestConfig> for PodManifest {
            .name
            .ok_or(ResolveError::MissingField("pod.name"))?;

-        let provider = resolve_provider(
-            cfg.provider,
-            "provider.kind",
-            "provider.model",
-            "provider.api_key_file",
+        let model = resolve_model(
+            cfg.model,
+            "model.scheme",
+            "model.model_id",
+            "model.auth.file",
        )?;

        let worker = WorkerManifest {
@ -361,14 +367,14 @@ impl TryFrom<PodManifestConfig> for PodManifest {
        let compaction = cfg
            .compaction
            .map(|c| -> Result<CompactionConfig, ResolveError> {
-                let comp_provider = c
-                    .provider
+                let comp_model = c
+                    .model
                    .map(|p| {
-                        resolve_provider(
+                        resolve_model(
                            p,
-                            "compaction.provider.kind",
-                            "compaction.provider.model",
-                            "compaction.provider.api_key_file",
+                            "compaction.model.scheme",
+                            "compaction.model.model_id",
+                            "compaction.model.auth.file",
                        )
                    })
                    .transpose()?;
@ -390,14 +396,14 @@ impl TryFrom<PodManifestConfig> for PodManifest {
                    compact_worker_max_input_tokens: c
                        .compact_worker_max_input_tokens
                        .unwrap_or(defaults::COMPACT_WORKER_MAX_INPUT_TOKENS),
-                    provider: comp_provider,
+                    model: comp_model,
                })
            })
            .transpose()?;

        Ok(PodManifest {
            pod: PodMeta { name },
-            provider,
+            model,
            worker,
            scope: cfg.scope,
            compaction,
@ -414,14 +420,21 @@ mod tests {
        PathBuf::from(format!("/tmp/insomnia-test{path}"))
    }

+    fn api_key_file_auth(path: PathBuf) -> AuthRef {
+        AuthRef::ApiKey {
+            env: None,
+            file: Some(path),
+        }
+    }
+
    fn minimal_valid() -> PodManifestConfig {
        PodManifestConfig {
            pod: PodMetaConfig {
                name: Some("test".into()),
            },
-            provider: ProviderConfigPartial {
-                kind: Some(ProviderKind::Anthropic),
-                model: Some("claude-sonnet-4-20250514".into()),
+            model: ModelConfigPartial {
+                scheme: Some(SchemeKind::Anthropic),
+                model_id: Some("claude-sonnet-4-20250514".into()),
                ..Default::default()
            },
            worker: WorkerManifestConfig::default(),
@ -441,16 +454,20 @@ mod tests {
    fn resolve_minimal_succeeds() {
        let manifest: PodManifest = minimal_valid().try_into().unwrap();
        assert_eq!(manifest.pod.name, "test");
-        assert_eq!(manifest.provider.kind, ProviderKind::Anthropic);
+        assert_eq!(manifest.model.scheme, SchemeKind::Anthropic);
    }

    #[test]
-    fn resolve_paths_joins_relative_api_key_file() {
+    fn resolve_paths_joins_relative_auth_file() {
        let mut cfg = minimal_valid();
-        cfg.provider.api_key_file = Some(PathBuf::from("keys/anthropic"));
+        cfg.model.auth = Some(api_key_file_auth(PathBuf::from("keys/anthropic")));
        let resolved = cfg.resolve_paths(Path::new("/home/user/.config/insomnia"));
+        let file = match resolved.model.auth {
+            Some(AuthRef::ApiKey { file, .. }) => file,
+            _ => panic!("expected ApiKey"),
+        };
        assert_eq!(
-            resolved.provider.api_key_file.as_deref(),
+            file.as_deref(),
            Some(Path::new("/home/user/.config/insomnia/keys/anthropic"))
        );
    }
@ -458,12 +475,13 @@ mod tests {
    #[test]
    fn resolve_paths_leaves_absolute_paths_untouched() {
        let mut cfg = minimal_valid();
-        cfg.provider.api_key_file = Some(PathBuf::from("/etc/already/abs"));
+        cfg.model.auth = Some(api_key_file_auth(PathBuf::from("/etc/already/abs")));
        let resolved = cfg.resolve_paths(Path::new("/home/user"));
-        assert_eq!(
-            resolved.provider.api_key_file.as_deref(),
-            Some(Path::new("/etc/already/abs"))
-        );
+        let file = match resolved.model.auth {
+            Some(AuthRef::ApiKey { file, .. }) => file,
+            _ => panic!("expected ApiKey"),
+        };
+        assert_eq!(file.as_deref(), Some(Path::new("/etc/already/abs")));
    }

    #[test]
@ -484,16 +502,14 @@ mod tests {
    }

    #[test]
-    fn try_from_invariant_rejects_lingering_relative_api_key_file() {
+    fn try_from_invariant_rejects_lingering_relative_auth_file() {
        let mut cfg = minimal_valid();
-        cfg.provider.api_key_file = Some(PathBuf::from("keys/relative"));
-        // Skipping resolve_paths on purpose: TryFrom must catch the
-        // invariant violation.
+        cfg.model.auth = Some(api_key_file_auth(PathBuf::from("keys/relative")));
        let err = PodManifest::try_from(cfg).unwrap_err();
        assert!(matches!(
            err,
            ResolveError::RelativePath {
-                field: "provider.api_key_file",
+                field: "model.auth.file",
                ..
            }
        ));
@ -535,8 +551,8 @@ mod tests {
            pod: PodMetaConfig {
                name: Some("lower".into()),
            },
-            provider: ProviderConfigPartial {
-                model: Some("lower-model".into()),
+            model: ModelConfigPartial {
+                model_id: Some("lower-model".into()),
                ..Default::default()
            },
            ..Default::default()
@ -549,8 +565,8 @@ mod tests {
        };
        let merged = lower.merge(upper);
        assert_eq!(merged.pod.name.as_deref(), Some("upper"));
-        // model not present in upper — retain lower
-        assert_eq!(merged.provider.model.as_deref(), Some("lower-model"));
+        // model_id not present in upper — retain lower
+        assert_eq!(merged.model.model_id.as_deref(), Some("lower-model"));
    }

    #[test]
@ -706,9 +722,9 @@ permission = "write"
            pod: PodMetaConfig {
                name: Some("x".into()),
            },
-            provider: ProviderConfigPartial {
-                kind: Some(ProviderKind::Anthropic),
-                model: Some("m".into()),
+            model: ModelConfigPartial {
+                scheme: Some(SchemeKind::Anthropic),
+                model_id: Some("m".into()),
                ..Default::default()
            },
            scope: ScopeConfig {
@ -734,9 +750,9 @@ permission = "write"
        let builtin = PodManifestConfig::default();
        let user = PodManifestConfig::from_toml(
            r#"
-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"
 "#,
        )
        .unwrap();
@ -759,7 +775,7 @@ name = "dbg"
        let merged = builtin.merge(user).merge(project).merge(overlay);
        let manifest: PodManifest = merged.try_into().unwrap();
        assert_eq!(manifest.pod.name, "dbg");
-        assert_eq!(manifest.provider.kind, ProviderKind::Anthropic);
+        assert_eq!(manifest.model.scheme, SchemeKind::Anthropic);
        assert_eq!(manifest.scope.allow.len(), 1);
    }
 }
--- a/crates/manifest/src/lib.rs
+++ b/crates/manifest/src/lib.rs
@ -1,30 +1,31 @@
 mod config;
 pub mod defaults;
+mod model;
 mod scope;

 pub use config::{
-    CompactionConfigPartial, PodManifestConfig, PodMetaConfig, ProviderConfigPartial, ResolveError,
+    CompactionConfigPartial, ModelConfigPartial, PodManifestConfig, PodMetaConfig, ResolveError,
    ToolOutputLimitsPartial, WorkerManifestConfig,
 };
+pub use model::{AuthRef, ModelConfig, SchemeKind};
 pub use protocol::{Permission, ScopeRule};
 pub use scope::{Scope, ScopeError};

 use std::collections::HashMap;
 use std::num::NonZeroU32;
-use std::path::PathBuf;

 use serde::{Deserialize, Serialize};

 /// Declarative configuration for a Pod.
 ///
-/// Parsed from a TOML manifest file. Describes the provider, model,
-/// system prompt, and directory scope (required). The Pod's working
-/// directory is **not** part of the manifest — it is the process's
-/// `std::env::current_dir()` at construction time.
+/// Parsed from a TOML manifest file. Describes the model, system prompt,
+/// and directory scope (required). The Pod's working directory is **not**
+/// part of the manifest — it is the process's `std::env::current_dir()`
+/// at construction time.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct PodManifest {
    pub pod: PodMeta,
-    pub provider: ProviderConfig,
+    pub model: ModelConfig,
    pub worker: WorkerManifest,
    pub scope: ScopeConfig,
    #[serde(default)]
@ -37,44 +38,6 @@ pub struct PodMeta {
    pub name: String,
 }

-/// LLM provider configuration.
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct ProviderConfig {
-    pub kind: ProviderKind,
-    pub model: String,
-    /// Path to a file containing the API key (read and trimmed at startup).
-    #[serde(default)]
-    pub api_key_file: Option<PathBuf>,
-    /// Custom base URL for the provider API.
-    #[serde(default)]
-    pub base_url: Option<String>,
-}
-
-/// Supported LLM providers.
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
-#[serde(rename_all = "lowercase")]
-pub enum ProviderKind {
-    Anthropic,
-    Openai,
-    Gemini,
-    Ollama,
-}
-
-impl ProviderKind {
-    /// Conventional environment variable name for the API key.
-    ///
-    /// Returns `INSOMNIA_API_KEY_{KIND}` (e.g. `INSOMNIA_API_KEY_ANTHROPIC`).
-    pub fn env_var_name(self) -> String {
-        let kind = match self {
-            Self::Anthropic => "ANTHROPIC",
-            Self::Openai => "OPENAI",
-            Self::Gemini => "GEMINI",
-            Self::Ollama => "OLLAMA",
-        };
-        format!("INSOMNIA_API_KEY_{kind}")
-    }
-}
-
 /// Worker-level configuration embedded in the manifest.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct WorkerManifest {
@ -211,10 +174,10 @@ pub struct CompactionConfig {
    #[serde(default = "default_compact_worker_max_input_tokens")]
    pub compact_worker_max_input_tokens: u64,

-    /// Optional provider for the compactor (summary) LLM.
-    /// If omitted, the main provider is cloned via `clone_boxed()`.
+    /// Optional model for the compactor (summary) LLM.
+    /// If omitted, the main model is cloned via `clone_boxed()`.
    #[serde(default)]
-    pub provider: Option<ProviderConfig>,
+    pub model: Option<ModelConfig>,
 }

 fn default_prune_protected_turns() -> usize {
@ -243,7 +206,7 @@ impl Default for CompactionConfig {
            compact_retained_tokens: default_compact_retained_tokens(),
            compact_auto_read_budget: default_compact_auto_read_budget(),
            compact_worker_max_input_tokens: default_compact_worker_max_input_tokens(),
-            provider: None,
+            model: None,
        }
    }
 }
@ -263,9 +226,9 @@ mod tests {
 [pod]
 name = "test-agent"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [worker]

@ -278,9 +241,9 @@ permission = "write"
    fn parse_minimal_manifest() {
        let manifest = PodManifest::from_toml(MINIMAL_REQUIRED).unwrap();
        assert_eq!(manifest.pod.name, "test-agent");
-        assert_eq!(manifest.provider.kind, ProviderKind::Anthropic);
-        assert_eq!(manifest.provider.model, "claude-sonnet-4-20250514");
-        assert!(manifest.provider.api_key_file.is_none());
+        assert_eq!(manifest.model.scheme, SchemeKind::Anthropic);
+        assert_eq!(manifest.model.model_id, "claude-sonnet-4-20250514");
+        assert_eq!(manifest.model.auth, AuthRef::None);
        assert_eq!(manifest.scope.allow.len(), 1);
        assert!(manifest.scope.deny.is_empty());
        assert_eq!(manifest.worker.instruction, defaults::DEFAULT_INSTRUCTION);
@ -292,10 +255,10 @@ permission = "write"
 [pod]
 name = "code-reviewer"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
-api_key_file = "/abs/keys/anthropic"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"
+auth = { kind = "api_key", file = "/abs/keys/anthropic" }

 [worker]
 instruction = "$user/reviewer"
@ -317,10 +280,11 @@ permission = "write"
 "#;
        let manifest = PodManifest::from_toml(toml).unwrap();
        assert_eq!(manifest.pod.name, "code-reviewer");
-        assert_eq!(
-            manifest.provider.api_key_file.as_deref(),
-            Some(std::path::Path::new("/abs/keys/anthropic"))
-        );
+        let file = match &manifest.model.auth {
+            AuthRef::ApiKey { file, .. } => file.as_deref(),
+            _ => panic!("expected ApiKey"),
+        };
+        assert_eq!(file, Some(std::path::Path::new("/abs/keys/anthropic")));
        assert_eq!(manifest.worker.instruction, "$user/reviewer");
        assert_eq!(manifest.worker.max_tokens, Some(4096));
        assert_eq!(manifest.worker.temperature, Some(0.3));
@ -340,9 +304,9 @@ permission = "write"
 [pod]
 name = "missing-scope"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [worker]
 "#;
@ -408,20 +372,20 @@ model = "claude-sonnet-4-20250514"
    }

    #[test]
-    fn parse_compaction_with_provider() {
+    fn parse_compaction_with_model() {
        let toml = format!(
            "{MINIMAL_REQUIRED}\n\
             [compaction]\n\
             compact_threshold = 80000\n\n\
-             [compaction.provider]\n\
-             kind = \"gemini\"\n\
-             model = \"gemini-2.0-flash\"\n"
+             [compaction.model]\n\
+             scheme = \"gemini\"\n\
+             model_id = \"gemini-2.0-flash\"\n"
        );
        let manifest = PodManifest::from_toml(&toml).unwrap();
        let c = manifest.compaction.unwrap();
-        let p = c.provider.unwrap();
-        assert_eq!(p.kind, ProviderKind::Gemini);
-        assert_eq!(p.model, "gemini-2.0-flash");
+        let p = c.model.unwrap();
+        assert_eq!(p.scheme, SchemeKind::Gemini);
+        assert_eq!(p.model_id, "gemini-2.0-flash");
    }

    #[test]
@ -431,8 +395,9 @@ model = "claude-sonnet-4-20250514"
    }

    #[test]
-    fn reject_unknown_provider() {
-        let toml = MINIMAL_REQUIRED.replace("kind = \"anthropic\"", "kind = \"unknown_provider\"");
+    fn reject_unknown_scheme() {
+        let toml =
+            MINIMAL_REQUIRED.replace("scheme = \"anthropic\"", "scheme = \"unknown_scheme\"");
        assert!(PodManifest::from_toml(&toml).is_err());
    }

--- a/crates/manifest/src/model.rs
+++ b/crates/manifest/src/model.rs
@ -0,0 +1,74 @@
+//! LLM モデル宣言型
+//!
+//! Pod マニフェストの `[model]` セクションで記述する型。`scheme` と
+//! `auth` を直交軸として表現し、1 つの汎用アダプタ（`crates/provider`）
+//! で任意の wire / 認証組合せを受け止める。
+
+use std::path::PathBuf;
+
+use serde::{Deserialize, Serialize};
+
+/// Pod が使う LLM モデルの宣言。
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct ModelConfig {
+    /// wire format
+    pub scheme: SchemeKind,
+    /// API のベース URL。未指定なら scheme の既定値にフォールバック
+    #[serde(default)]
+    pub base_url: Option<String>,
+    /// プロバイダが受け付けるモデル ID
+    pub model_id: String,
+    /// 認証方式
+    #[serde(default)]
+    pub auth: AuthRef,
+}
+
+/// サポートする wire scheme の種類。
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "snake_case")]
+pub enum SchemeKind {
+    /// Anthropic Messages API (`/v1/messages`)。Ollama `/v1/messages` もこれで扱う
+    Anthropic,
+    /// OpenAI Chat Completions (`/v1/chat/completions`)。OpenAI 互換ルーター共通枠
+    OpenaiChat,
+    /// OpenAI Responses API (`/v1/responses`)。別チケットで scheme 新設予定
+    OpenaiResponses,
+    /// Google Gemini (`/v1beta/models/...:streamGenerateContent`)
+    Gemini,
+}
+
+/// 認証の参照。
+///
+/// 実際のトークン値の解決（env / file 読取、OAuth refresh 等）は
+/// `crates/provider` で行う。ここはあくまで「どこから取るか」の宣言。
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, Default)]
+#[serde(tag = "kind", rename_all = "snake_case")]
+pub enum AuthRef {
+    /// 認証不要（ローカル Ollama 等）
+    #[default]
+    None,
+    /// API key。env / file のいずれか（両方指定された場合は env が優先）
+    ApiKey {
+        /// 環境変数名。未指定のときは scheme ごとの既定（`INSOMNIA_API_KEY_*`）
+        #[serde(default)]
+        env: Option<String>,
+        /// key を書き込んだファイル（絶対パス）
+        #[serde(default)]
+        file: Option<PathBuf>,
+    },
+    /// ChatGPT OAuth（`~/.codex/auth.json`）。実装は `llm-auth-codex-oauth` チケット
+    CodexOAuth,
+}
+
+impl SchemeKind {
+    /// 既定の環境変数名（`INSOMNIA_API_KEY_*`）。
+    ///
+    /// `AuthRef::ApiKey { env: None, .. }` の env 未指定時に使う。
+    pub fn default_env_var(self) -> &'static str {
+        match self {
+            Self::Anthropic => "INSOMNIA_API_KEY_ANTHROPIC",
+            Self::OpenaiChat | Self::OpenaiResponses => "INSOMNIA_API_KEY_OPENAI",
+            Self::Gemini => "INSOMNIA_API_KEY_GEMINI",
+        }
+    }
+}
--- a/crates/pod/examples/pod_cli.rs
+++ b/crates/pod/examples/pod_cli.rs
@ -22,9 +22,9 @@ fn manifest_toml(pwd: &std::path::Path) -> String {
 name = "hello-pod"
 pwd = "{pwd}"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [worker]
 system_prompt = "You are a concise assistant. Reply in one or two sentences."
--- a/crates/pod/examples/pod_protocol.rs
+++ b/crates/pod/examples/pod_protocol.rs
@ -16,9 +16,9 @@ fn manifest_toml(pwd: &std::path::Path) -> String {
 name = "protocol-demo"
 pwd = "{pwd}"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [worker]
 system_prompt = "You are a concise assistant. Reply in one or two sentences."
--- a/crates/pod/src/controller.rs
+++ b/crates/pod/src/controller.rs
@ -113,7 +113,7 @@ impl PodController {
        let scope_for_tools = pod.scope().clone();
        let pwd_for_tools = pod.pwd().to_path_buf();
        let spawner_name = pod.manifest().pod.name.clone();
-        let spawner_provider = pod.manifest().provider.clone();
+        let spawner_model = pod.manifest().model.clone();

        // Parent callback socket (this Pod's own parent, used for
        // `PodEvent` upward reports). `None` for top-level Pods.
@ -230,7 +230,7 @@ impl PodController {
                pwd_for_tools,
                spawned_registry.clone(),
                self_parent_socket.clone(),
-                spawner_provider.clone(),
+                spawner_model.clone(),
            ));
            worker.register_tool(send_to_pod_tool(spawned_registry.clone()));
            worker.register_tool(read_pod_output_tool(spawned_registry.clone()));
@ -663,11 +663,11 @@ where
    St: Store,
 {
    let manifest = pod.manifest();
-    let provider = match manifest.provider.kind {
-        manifest::ProviderKind::Anthropic => "anthropic",
-        manifest::ProviderKind::Openai => "openai",
-        manifest::ProviderKind::Gemini => "gemini",
-        manifest::ProviderKind::Ollama => "ollama",
+    let provider = match manifest.model.scheme {
+        manifest::SchemeKind::Anthropic => "anthropic",
+        manifest::SchemeKind::OpenaiChat => "openai_chat",
+        manifest::SchemeKind::OpenaiResponses => "openai_responses",
+        manifest::SchemeKind::Gemini => "gemini",
    };
    // The tool list mirrors what `spawn()` registers on the Worker:
    // builtin filesystem tools plus the pod-orchestration tools.
@ -689,7 +689,7 @@ where
        pod_name: manifest.pod.name.clone(),
        cwd: pod.pwd().display().to_string(),
        provider: provider.into(),
-        model: manifest.provider.model.clone(),
+        model: manifest.model.model_id.clone(),
        scope_summary: pod.scope().summary(),
        tools: tool_names,
    }
--- a/crates/pod/src/factory.rs
+++ b/crates/pod/src/factory.rs
@ -317,9 +317,9 @@ mod tests {
 [pod]
 name = "solo"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [[scope.allow]]
 target = "{pwd}"
@ -342,9 +342,9 @@ permission = "write"
        let pwd = tmp.path().canonicalize().unwrap();
        let user_cfg = PodManifestConfig::from_toml(&format!(
            r#"
-[provider]
-kind = "anthropic"
-model = "user-model"
+[model]
+scheme = "anthropic"
+model_id = "user-model"

 [[scope.allow]]
 target = "{pwd}"
@ -355,8 +355,8 @@ permission = "read"
        .unwrap();
        let project_cfg = PodManifestConfig::from_toml(&format!(
            r#"
-[provider]
-model = "project-model"
+[model]
+model_id = "project-model"

 [[scope.allow]]
 target = "{pwd}"
@ -387,7 +387,7 @@ name = "overlay-name"
        // overlay layer so later calls win. This also exercises the
        // scope union across layers (two allow rules).
        assert_eq!(manifest.pod.name, "overlay-name");
-        assert_eq!(manifest.provider.model, "project-model");
+        assert_eq!(manifest.model.model_id, "project-model");
        assert_eq!(manifest.scope.allow.len(), 2);
    }

@ -406,9 +406,9 @@ name = "overlay-name"
 [pod]
 name = "from-user"

-[provider]
-kind = "anthropic"
-model = "user-model"
+[model]
+scheme = "anthropic"
+model_id = "user-model"

 [[scope.allow]]
 target = "{pwd}"
@ -423,8 +423,8 @@ permission = "write"
        write(
            &project_manifest,
            r#"
-[provider]
-model = "project-model"
+[model]
+model_id = "project-model"
 "#,
        );

@ -436,8 +436,8 @@ model = "project-model"
            .resolve()
            .unwrap();

-        // project layer overrides user layer on provider.model
-        assert_eq!(manifest.provider.model, "project-model");
+        // project layer overrides user layer on model.model_id
+        assert_eq!(manifest.model.model_id, "project-model");
        // user layer provides the rest
        assert_eq!(manifest.pod.name, "from-user");
    }
@ -454,9 +454,9 @@ model = "project-model"
 [pod]
 name = "walked-up"

-[provider]
-kind = "anthropic"
-model = "claude-sonnet-4-20250514"
+[model]
+scheme = "anthropic"
+model_id = "claude-sonnet-4-20250514"

 [[scope.allow]]
 target = "{root}"
@ -487,9 +487,9 @@ permission = "write"
 [pod]
 name = "standalone"

-[provider]
-kind = "anthropic"
-model = "m"
+[model]
+scheme = "anthropic"
+model_id = "m"

 [[scope.allow]]
 target = "{pwd}"
@ -529,9 +529,9 @@ permission = "write"
 [pod]
 name = "rel-user"

-[provider]
-kind = "anthropic"
-model = "m"
+[model]
+scheme = "anthropic"
+model_id = "m"

 [[scope.allow]]
 target = "./workspace"
@ -565,9 +565,9 @@ permission = "write"
 [pod]
 name = "rel-project"

-[provider]
-kind = "anthropic"
-model = "m"
+[model]
+scheme = "anthropic"
+model_id = "m"

 [[scope.allow]]
 target = "."
@ -604,9 +604,9 @@ permission = "write"
 [pod]
 name = "factory-pod"

-[provider]
-kind = "anthropic"
-model = "m"
+[model]
+scheme = "anthropic"
+model_id = "m"

 [[scope.allow]]
 target = "{root}"
@ -661,9 +661,9 @@ permission = "write"
        // pod.name missing — resolver must reject.
        let overlay = format!(
            r#"
-[provider]
-kind = "anthropic"
-model = "m"
+[model]
+scheme = "anthropic"
+model_id = "m"

 [[scope.allow]]
 target = "{pwd}"
--- a/crates/pod/src/lib.rs
+++ b/crates/pod/src/lib.rs
@ -31,7 +31,7 @@ pub use factory::{FactoryError, PodFactory};
 pub use notifier::Notifier;
 pub use hook::{Hook, HookEventKind, HookRegistryBuilder};
 pub use manifest::{
-    PodManifest, PodManifestConfig, PodMetaConfig, ProviderConfig, ProviderKind, Scope,
+    AuthRef, ModelConfig, PodManifest, PodManifestConfig, PodMetaConfig, Scope, SchemeKind,
 };
 pub use pod::{Pod, PodError, PodRunResult, apply_worker_manifest};
 pub use prompt_loader::PromptLoader;
--- a/crates/pod/src/pod.rs
+++ b/crates/pod/src/pod.rs
@ -818,7 +818,7 @@ impl<C: LlmClient, St: Store> Pod<C, St> {
    /// `[summary, ...recent_turns]` and creating a new session.
    ///
    /// The summary Worker uses:
-    /// - `compaction.provider` from the manifest if configured, or
+    /// - `compaction.model` from the manifest if configured, or
    /// - a clone of the main LlmClient via `clone_boxed()`.
    ///
    /// Returns the new session ID.
@ -1056,12 +1056,12 @@ impl<C: LlmClient, St: Store> Pod<C, St> {

    /// Build the LlmClient for the compactor Worker.
    ///
-    /// Uses `compaction.provider` from manifest if set, otherwise clones
+    /// Uses `compaction.model` from manifest if set, otherwise clones
    /// the main client.
    fn build_compactor_client(&self) -> Result<Box<dyn LlmClient>, PodError> {
        if let Some(ref compaction) = self.manifest.compaction {
-            if let Some(ref provider_config) = compaction.provider {
-                let client = provider::build_client(provider_config)?;
+            if let Some(ref model_config) = compaction.model {
+                let client = provider::build_client(model_config)?;
                return Ok(client);
            }
        }
@ -1109,7 +1109,7 @@ impl<St: Store> Pod<Box<dyn LlmClient>, St> {
            scope.allow_rules(),
        )?;

-        let client = provider::build_client(&manifest.provider)?;
+        let client = provider::build_client(&manifest.model)?;
        let mut worker = Worker::new(client);
        apply_worker_manifest(&mut worker, &manifest.worker);

@ -1176,7 +1176,7 @@ impl<St: Store> Pod<Box<dyn LlmClient>, St> {
        let scope_allocation =
            scope_lock::adopt_allocation(manifest.pod.name.clone(), std::process::id())?;

-        let client = provider::build_client(&manifest.provider)?;
+        let client = provider::build_client(&manifest.model)?;
        let mut worker = Worker::new(client);
        apply_worker_manifest(&mut worker, &manifest.worker);

--- a/crates/pod/src/spawn_pod.rs
+++ b/crates/pod/src/spawn_pod.rs
@ -14,8 +14,8 @@ use std::time::Duration;
 use async_trait::async_trait;
 use llm_worker::tool::{Tool, ToolDefinition, ToolError, ToolMeta, ToolOutput};
 use manifest::{
-    Permission, PodManifestConfig, PodMetaConfig, ProviderConfig, ProviderConfigPartial,
-    ScopeConfig, ScopeRule, WorkerManifestConfig,
+    ModelConfig, ModelConfigPartial, Permission, PodManifestConfig, PodMetaConfig, ScopeConfig,
+    ScopeRule, WorkerManifestConfig,
 };
 use protocol::Method;
 use protocol::stream::JsonLineWriter;
@ -118,7 +118,7 @@ pub struct SpawnPodTool {
    /// Pod's overlay TOML so the child does not need its own provider
    /// configuration in the manifest cascade. Per-spawn override is
    /// out of scope here (see `tickets/spawn-inherit-provider.md`).
-    spawner_provider: ProviderConfig,
+    spawner_model: ModelConfig,
 }

 impl SpawnPodTool {
@ -129,7 +129,7 @@ impl SpawnPodTool {
        spawner_pwd: PathBuf,
        registry: Arc<SpawnedPodRegistry>,
        parent_socket: Option<PathBuf>,
-        spawner_provider: ProviderConfig,
+        spawner_model: ModelConfig,
    ) -> Self {
        Self {
            spawner_name,
@ -138,7 +138,7 @@ impl SpawnPodTool {
            spawner_pwd,
            registry,
            parent_socket,
-            spawner_provider,
+            spawner_model,
        }
    }
 }
@ -196,7 +196,7 @@ impl Tool for SpawnPodTool {
            &input.name,
            &instruction,
            &scope_allow,
-            &self.spawner_provider,
+            &self.spawner_model,
        ) {
            Ok(s) => s,
            Err(e) => {
@ -350,17 +350,17 @@ fn build_overlay_toml(
    name: &str,
    instruction: &str,
    scope_allow: &[ScopeRule],
-    provider: &ProviderConfig,
+    model: &ModelConfig,
 ) -> Result<String, toml::ser::Error> {
    let overlay = PodManifestConfig {
        pod: PodMetaConfig {
            name: Some(name.to_string()),
        },
-        provider: ProviderConfigPartial {
-            kind: Some(provider.kind),
-            model: Some(provider.model.clone()),
-            api_key_file: provider.api_key_file.clone(),
-            base_url: provider.base_url.clone(),
+        model: ModelConfigPartial {
+            scheme: Some(model.scheme),
+            base_url: model.base_url.clone(),
+            model_id: Some(model.model_id.clone()),
+            auth: Some(model.auth.clone()),
        },
        worker: WorkerManifestConfig {
            instruction: Some(instruction.to_string()),
@ -458,7 +458,7 @@ pub fn spawn_pod_tool(
    spawner_pwd: PathBuf,
    registry: Arc<SpawnedPodRegistry>,
    parent_socket: Option<PathBuf>,
-    spawner_provider: ProviderConfig,
+    spawner_model: ModelConfig,
 ) -> ToolDefinition {
    Arc::new(move || {
        let schema = schemars::schema_for!(SpawnPodInput);
@ -473,7 +473,7 @@ pub fn spawn_pod_tool(
            spawner_pwd.clone(),
            registry.clone(),
            parent_socket.clone(),
-            spawner_provider.clone(),
+            spawner_model.clone(),
        ));
        (meta, tool)
    })
@ -482,29 +482,30 @@ pub fn spawn_pod_tool(
 #[cfg(test)]
 mod tests {
    use super::*;
-    use manifest::ProviderKind;
+    use manifest::{AuthRef, SchemeKind};

    #[test]
-    fn overlay_inherits_spawner_provider() {
-        let provider = ProviderConfig {
-            kind: ProviderKind::Anthropic,
-            model: "claude-sonnet-4".into(),
-            api_key_file: Some(PathBuf::from("/etc/keys/anthropic")),
+    fn overlay_inherits_spawner_model() {
+        let model = ModelConfig {
+            scheme: SchemeKind::Anthropic,
            base_url: Some("https://example.test".into()),
+            model_id: "claude-sonnet-4".into(),
+            auth: AuthRef::ApiKey {
+                env: None,
+                file: Some(PathBuf::from("/etc/keys/anthropic")),
+            },
        };

-        let toml_str = build_overlay_toml("child", "$insomnia/default", &[], &provider).unwrap();
+        let toml_str = build_overlay_toml("child", "$insomnia/default", &[], &model).unwrap();
        let parsed = PodManifestConfig::from_toml(&toml_str).unwrap();

-        assert_eq!(parsed.provider.kind, Some(ProviderKind::Anthropic));
-        assert_eq!(parsed.provider.model.as_deref(), Some("claude-sonnet-4"));
-        assert_eq!(
-            parsed.provider.api_key_file.as_deref(),
-            Some(Path::new("/etc/keys/anthropic"))
-        );
-        assert_eq!(
-            parsed.provider.base_url.as_deref(),
-            Some("https://example.test")
-        );
+        assert_eq!(parsed.model.scheme, Some(SchemeKind::Anthropic));
+        assert_eq!(parsed.model.model_id.as_deref(), Some("claude-sonnet-4"));
+        assert_eq!(parsed.model.base_url.as_deref(), Some("https://example.test"));
+        let file = match parsed.model.auth {
+            Some(AuthRef::ApiKey { file, .. }) => file,
+            _ => panic!("expected ApiKey"),
+        };
+        assert_eq!(file.as_deref(), Some(Path::new("/etc/keys/anthropic")));
    }
 }
--- a/crates/pod/tests/controller_test.rs
+++ b/crates/pod/tests/controller_test.rs
@ -110,9 +110,9 @@ const MANIFEST_TOML: &str = r#"
 name = "test-pod"
 pwd = "./"

-[provider]
-kind = "anthropic"
-model = "test-model"
+[model]
+scheme = "anthropic"
+model_id = "test-model"

 [worker]
 max_tokens = 100
--- a/crates/pod/tests/spawn_pod_test.rs
+++ b/crates/pod/tests/spawn_pod_test.rs
@ -11,7 +11,7 @@ use std::path::{Path, PathBuf};
 use std::sync::{LazyLock, Mutex};

 use llm_worker::tool::{ToolError, ToolOutput};
-use manifest::{Permission, ProviderConfig, ProviderKind, ScopeRule};
+use manifest::{AuthRef, ModelConfig, Permission, SchemeKind, ScopeRule};
 use pod::runtime_dir::{RuntimeDir, SpawnedPodRecord};
 use pod::scope_lock::{self, LockFileGuard};
 use pod::spawn_pod::spawn_pod_tool;
@ -132,15 +132,15 @@ fn which_true() -> String {
    "/bin/true".into()
 }

-/// Tests don't exercise the provider — they intercept the spawned
+/// Tests don't exercise the model — they intercept the spawned
 /// child via a mock socket — but `spawn_pod_tool` needs a value to
-/// embed in the overlay TOML. Any well-formed `ProviderConfig` works.
-fn dummy_provider() -> ProviderConfig {
-    ProviderConfig {
-        kind: ProviderKind::Anthropic,
-        model: "claude-test".into(),
-        api_key_file: None,
+/// embed in the overlay TOML. Any well-formed `ModelConfig` works.
+fn dummy_model() -> ModelConfig {
+    ModelConfig {
+        scheme: SchemeKind::Anthropic,
        base_url: None,
+        model_id: "claude-test".into(),
+        auth: AuthRef::None,
    }
 }

@ -171,7 +171,7 @@ async fn spawn_pod_delegates_scope_and_sends_run() {
        allow_root.path().to_path_buf(),
        registry,
        None,
-        dummy_provider(),
+        dummy_model(),
    );
    let (_meta, tool) = def();

@ -234,7 +234,7 @@ async fn spawn_pod_rejects_scope_outside_spawner() {
        allow_root.path().to_path_buf(),
        registry,
        None,
-        dummy_provider(),
+        dummy_model(),
    );
    let (_meta, tool) = def();

@ -293,7 +293,7 @@ async fn spawn_pod_rolls_back_reservation_when_socket_never_appears() {
        allow_root.path().to_path_buf(),
        registry,
        None,
-        dummy_provider(),
+        dummy_model(),
    );
    let (_meta, tool) = def();

--- a/crates/pod/tests/system_prompt_template_test.rs
+++ b/crates/pod/tests/system_prompt_template_test.rs
@ -79,9 +79,9 @@ const MINIMAL_MANIFEST_TOML: &str = r#"
 name = "test-pod"
 pwd = "./"

-[provider]
-kind = "anthropic"
-model = "test-model"
+[model]
+scheme = "anthropic"
+model_id = "test-model"

 [worker]
 max_tokens = 100
--- a/crates/provider/README.md
+++ b/crates/provider/README.md
@ -1,8 +1,15 @@
 # provider

-マニフェストの設定から適切な LLM クライアントを構築するファクトリクレート。APIキーの環境変数解決を含む。
+マニフェストの `ModelConfig` から適切な `LlmClient`（`HttpTransport<S>`）を構築するファクトリクレート。APIキーの環境変数 / ファイル解決と scheme ↔ auth の整合検証を担う。

 ## 公開型

- `build_client(config: &ProviderConfig) -> Result<Box<dyn LlmClient>, ProviderError>` — プロバイダ設定に応じたクライアント生成（Anthropic, OpenAI, Gemini, Ollama）
+- `build_client(config: &ModelConfig) -> Result<Box<dyn LlmClient>, ProviderError>` — `SchemeKind` と `AuthRef` から `HttpTransport<S>` を構築
 - `ProviderError` — クライアント構築エラー
+
+## 責務
+
+- `AuthRef::ApiKey` を `ResolvedAuth::ApiKey` に解決（env → file の優先順位）
+- `AuthRef::None` を `ResolvedAuth::None` に変換
+- `Scheme::required_auth()` と `ResolvedAuth` の妥当性検証（非対応組合せは構築エラー）
+- 既知モデルは scheme の静的テーブル、未知モデルは scheme 既定の `ModelCapability` を採用
--- a/crates/provider/src/lib.rs
+++ b/crates/provider/src/lib.rs
@ -1,99 +1,148 @@
-use llm_worker::llm_client::client::LlmClient;
-use llm_worker::llm_client::providers::anthropic::AnthropicClient;
-use llm_worker::llm_client::providers::gemini::GeminiClient;
-use llm_worker::llm_client::providers::ollama::OllamaClient;
-use llm_worker::llm_client::providers::openai::OpenAIClient;
+//! Pod マニフェストの [`ModelConfig`] を [`Box<dyn LlmClient>`]
+//! に落とすファクトリ。
+//!
+//! * `SchemeKind` を各 `Scheme` 実装にマップ
+//! * `AuthRef` を環境変数 / ファイルから解決して [`ResolvedAuth`] に
+//! * `scheme.required_auth()` と解決値を照合（非対応組合せは構築エラー）
+//! * `ModelCapability` は明示指定 → scheme 静的テーブル → 未知時はデフォルト
+//!
+//! llm-worker は低レベル基盤に留める方針なので、高レベル側で必要に
+//! なる認証ストア解決（Codex OAuth の `~/.codex/auth.json` 読取等）は
+//! このクレートに追加する。

-use manifest::{ProviderConfig, ProviderKind};
+use llm_worker::llm_client::{
+    LlmClient,
+    capability::{CacheStrategy, ModelCapability, StructuredOutput, ToolCallingSupport},
+    scheme::{
+        Scheme, anthropic::AnthropicScheme, gemini::GeminiScheme, openai_chat::OpenAIScheme,
+    },
+    transport::{HttpTransport, ResolvedAuth},
+};

-/// Errors from provider client construction.
+use manifest::{AuthRef, ModelConfig, SchemeKind};
+
+/// プロバイダ構築時のエラー。
 #[derive(Debug, thiserror::Error)]
 pub enum ProviderError {
-    #[error("provider configuration error: {0}")]
+    #[error("model configuration error: {0}")]
    Config(String),

-    #[error("API key not provided for {provider}")]
-    ApiKeyMissing { provider: String },
+    #[error("API key not provided for scheme {scheme:?}")]
+    ApiKeyMissing { scheme: SchemeKind },
+
+    #[error("scheme {scheme:?} does not support this auth")]
+    AuthMismatch { scheme: SchemeKind },
+
+    #[error("scheme {scheme:?} is not implemented yet")]
+    SchemeNotImplemented { scheme: SchemeKind },
 }

-/// Resolve the API key for the given provider configuration.
+/// `AuthRef` をランタイムで使える [`ResolvedAuth`] に解決する。
 ///
-/// Resolution order:
-/// 1. Environment variable `INSOMNIA_API_KEY_{KIND}`
-/// 2. File specified by `api_key_file` (must be an absolute path; the
-///    cascade layer is responsible for normalisation)
-/// 3. `None`
-fn resolve_api_key(config: &ProviderConfig) -> Result<Option<String>, ProviderError> {
-    let env_name = config.kind.env_var_name();
-    if let Ok(val) = std::env::var(&env_name) {
-        return Ok(Some(val));
-    }
-
-    if let Some(ref path) = config.api_key_file {
-        if !path.is_absolute() {
-            return Err(ProviderError::Config(format!(
-                "api_key_file must be absolute: {}",
-                path.display()
-            )));
+/// 解決順:
+/// 1. `AuthRef::ApiKey { env, .. }` で env が指定されていればその変数を参照
+/// 2. そうでなければ scheme 既定の環境変数 (`SchemeKind::default_env_var`)
+/// 3. それでも無ければ `file` を読む（絶対パスのみ）
+fn resolve_auth(
+    scheme: SchemeKind,
+    auth: &AuthRef,
+) -> Result<ResolvedAuth, ProviderError> {
+    match auth {
+        AuthRef::None => Ok(ResolvedAuth::None),
+        AuthRef::ApiKey { env, file } => {
+            let env_name = env.as_deref().unwrap_or(scheme.default_env_var());
+            if let Ok(val) = std::env::var(env_name)
+                && !val.is_empty()
+            {
+                return Ok(ResolvedAuth::ApiKey(val));
+            }
+            if let Some(path) = file {
+                if !path.is_absolute() {
+                    return Err(ProviderError::Config(format!(
+                        "auth.file must be absolute: {}",
+                        path.display()
+                    )));
+                }
+                let contents = std::fs::read_to_string(path).map_err(|e| {
+                    ProviderError::Config(format!(
+                        "failed to read auth.file {}: {e}",
+                        path.display()
+                    ))
+                })?;
+                return Ok(ResolvedAuth::ApiKey(contents.trim().to_owned()));
+            }
+            Err(ProviderError::ApiKeyMissing { scheme })
        }
-        let contents = std::fs::read_to_string(path).map_err(|e| {
-            ProviderError::Config(format!(
-                "failed to read api_key_file {}: {e}",
-                path.display()
-            ))
-        })?;
-        return Ok(Some(contents.trim().to_owned()));
+        AuthRef::CodexOAuth => Err(ProviderError::Config(
+            "codex_oauth auth not yet implemented (tickets/llm-auth-codex-oauth)".into(),
+        )),
    }
-
-    Ok(None)
 }

-/// Build an [`LlmClient`] from a [`ProviderConfig`].
-///
-/// `api_key_file` (if set) must already be an absolute path — relative
-/// paths are rejected because cascade resolution is the sole source of
-/// path normalisation.
-pub fn build_client(config: &ProviderConfig) -> Result<Box<dyn LlmClient>, ProviderError> {
-    let api_key = resolve_api_key(config)?;
+/// `SchemeKind` ごとに固定のデフォルト capability（未知モデル用）。
+fn default_capability(scheme: SchemeKind) -> ModelCapability {
+    match scheme {
+        SchemeKind::Anthropic => ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: false,
+            // Ollama の /v1/messages 流用時に cache_control を拒否されないよう Auto
+            prompt_caching: CacheStrategy::Auto,
+        },
+        SchemeKind::OpenaiChat | SchemeKind::OpenaiResponses => ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: false,
+            prompt_caching: CacheStrategy::Auto,
+        },
+        SchemeKind::Gemini => ModelCapability {
+            tool_calling: ToolCallingSupport::Parallel,
+            structured_output: StructuredOutput::JsonSchema,
+            reasoning: None,
+            vision: true,
+            prompt_caching: CacheStrategy::Auto,
+        },
+    }
+}

-    match config.kind {
-        ProviderKind::Anthropic => {
-            let key = api_key.ok_or_else(|| ProviderError::ApiKeyMissing {
-                provider: "anthropic".into(),
-            })?;
-            let mut client = AnthropicClient::new(key, &config.model);
-            if let Some(ref url) = config.base_url {
-                client = client.with_base_url(url);
-            }
-            Ok(Box::new(client))
-        }
-        ProviderKind::Openai => {
-            let key = api_key.ok_or_else(|| ProviderError::ApiKeyMissing {
-                provider: "openai".into(),
-            })?;
-            let mut client = OpenAIClient::new(key, &config.model);
-            if let Some(ref url) = config.base_url {
-                client = client.with_base_url(url);
-            }
-            Ok(Box::new(client))
-        }
-        ProviderKind::Gemini => {
-            let key = api_key.ok_or_else(|| ProviderError::ApiKeyMissing {
-                provider: "gemini".into(),
-            })?;
-            let mut client = GeminiClient::new(key, &config.model);
-            if let Some(ref url) = config.base_url {
-                client = client.with_base_url(url);
-            }
-            Ok(Box::new(client))
-        }
-        ProviderKind::Ollama => {
-            let mut client = OllamaClient::new(&config.model);
-            if let Some(ref url) = config.base_url {
-                client = client.with_base_url(url);
-            }
-            Ok(Box::new(client))
-        }
+fn build_transport<S: Scheme>(
+    scheme: S,
+    config: &ModelConfig,
+    resolved: ResolvedAuth,
+) -> Result<Box<dyn LlmClient>, ProviderError> {
+    if !resolved.matches(scheme.required_auth()) {
+        return Err(ProviderError::AuthMismatch {
+            scheme: config.scheme,
+        });
+    }
+    let capability = scheme
+        .capability_for(&config.model_id)
+        .unwrap_or_else(|| default_capability(config.scheme));
+    let base_url = config
+        .base_url
+        .clone()
+        .unwrap_or_else(|| scheme.default_base_url().to_string());
+    Ok(Box::new(HttpTransport::new(
+        scheme,
+        config.model_id.clone(),
+        base_url,
+        resolved,
+        capability,
+    )))
+}
+
+/// [`ModelConfig`] から [`LlmClient`] を構築する。
+pub fn build_client(config: &ModelConfig) -> Result<Box<dyn LlmClient>, ProviderError> {
+    let resolved = resolve_auth(config.scheme, &config.auth)?;
+    match config.scheme {
+        SchemeKind::Anthropic => build_transport(AnthropicScheme::new(), config, resolved),
+        SchemeKind::OpenaiChat => build_transport(OpenAIScheme::new(), config, resolved),
+        SchemeKind::Gemini => build_transport(GeminiScheme::new(), config, resolved),
+        SchemeKind::OpenaiResponses => Err(ProviderError::SchemeNotImplemented {
+            scheme: config.scheme,
+        }),
    }
 }

@ -104,23 +153,29 @@ mod tests {
    use std::io::Write;
    use std::path::PathBuf;

-    fn anthropic_config() -> ProviderConfig {
-        ProviderConfig {
-            kind: ProviderKind::Anthropic,
-            model: "test-model".into(),
-            api_key_file: None,
+    fn anthropic_config() -> ModelConfig {
+        ModelConfig {
+            scheme: SchemeKind::Anthropic,
            base_url: None,
+            model_id: "claude-sonnet-4-20250514".into(),
+            auth: AuthRef::ApiKey {
+                env: None,
+                file: None,
+            },
        }
    }

    #[test]
    #[serial]
    fn resolve_from_env() {
-        let env_name = ProviderKind::Anthropic.env_var_name();
-        unsafe { std::env::set_var(&env_name, "sk-from-env") };
-        let key = resolve_api_key(&anthropic_config()).unwrap();
-        unsafe { std::env::remove_var(&env_name) };
-        assert_eq!(key.as_deref(), Some("sk-from-env"));
+        let env_name = SchemeKind::Anthropic.default_env_var();
+        unsafe { std::env::set_var(env_name, "sk-from-env") };
+        let auth = resolve_auth(SchemeKind::Anthropic, &anthropic_config().auth).unwrap();
+        unsafe { std::env::remove_var(env_name) };
+        match auth {
+            ResolvedAuth::ApiKey(k) => assert_eq!(k, "sk-from-env"),
+            _ => panic!("expected ApiKey"),
+        }
    }

    #[test]
@ -129,14 +184,20 @@ mod tests {
        let key_path = dir.path().join("key.txt");
        {
            let mut f = std::fs::File::create(&key_path).unwrap();
-            write!(f, "  sk-from-file\n").unwrap();
+            writeln!(f, "  sk-from-file").unwrap();
        }
-        let config = ProviderConfig {
-            api_key_file: Some(key_path),
+        let config = ModelConfig {
+            auth: AuthRef::ApiKey {
+                env: Some("INSOMNIA_API_KEY_NONEXISTENT".into()),
+                file: Some(key_path),
+            },
            ..anthropic_config()
        };
-        let key = resolve_api_key(&config).unwrap();
-        assert_eq!(key.as_deref(), Some("sk-from-file"));
+        let auth = resolve_auth(config.scheme, &config.auth).unwrap();
+        match auth {
+            ResolvedAuth::ApiKey(k) => assert_eq!(k, "sk-from-file"),
+            _ => panic!("expected ApiKey"),
+        }
    }

    #[test]
@ -146,43 +207,57 @@ mod tests {
        let key_path = dir.path().join("key.txt");
        std::fs::write(&key_path, "sk-from-file").unwrap();

-        let env_name = ProviderKind::Anthropic.env_var_name();
-        unsafe { std::env::set_var(&env_name, "sk-from-env") };
+        let env_name = SchemeKind::Anthropic.default_env_var();
+        unsafe { std::env::set_var(env_name, "sk-from-env") };

-        let config = ProviderConfig {
-            api_key_file: Some(key_path),
+        let config = ModelConfig {
+            auth: AuthRef::ApiKey {
+                env: None,
+                file: Some(key_path),
+            },
            ..anthropic_config()
        };
-        let key = resolve_api_key(&config).unwrap();
-        unsafe { std::env::remove_var(&env_name) };
-        assert_eq!(key.as_deref(), Some("sk-from-env"));
+        let auth = resolve_auth(config.scheme, &config.auth).unwrap();
+        unsafe { std::env::remove_var(env_name) };
+        match auth {
+            ResolvedAuth::ApiKey(k) => assert_eq!(k, "sk-from-env"),
+            _ => panic!("expected ApiKey"),
+        }
    }

    #[test]
-    fn relative_api_key_file_is_rejected() {
-        let config = ProviderConfig {
-            api_key_file: Some(PathBuf::from("keys/anthropic")),
+    fn relative_auth_file_is_rejected() {
+        let config = ModelConfig {
+            auth: AuthRef::ApiKey {
+                env: Some("INSOMNIA_API_KEY_NONEXISTENT".into()),
+                file: Some(PathBuf::from("keys/anthropic")),
+            },
            ..anthropic_config()
        };
-        let err = resolve_api_key(&config).unwrap_err();
+        let err = resolve_auth(config.scheme, &config.auth).unwrap_err();
        assert!(matches!(err, ProviderError::Config(_)));
    }

    #[test]
+    #[serial]
    fn missing_key_returns_api_key_missing() {
-        let config = anthropic_config();
-        let result = build_client(&config);
+        let env_name = SchemeKind::Anthropic.default_env_var();
+        unsafe { std::env::remove_var(env_name) };
+        let result = build_client(&anthropic_config());
        assert!(matches!(result, Err(ProviderError::ApiKeyMissing { .. })));
    }

    #[test]
    fn ollama_succeeds_without_key() {
-        let config = ProviderConfig {
-            kind: ProviderKind::Ollama,
-            model: "llama3".into(),
-            api_key_file: None,
-            base_url: None,
+        // Ollama = Anthropic scheme + base_url 差し替え + AuthRef::None
+        let config = ModelConfig {
+            scheme: SchemeKind::Anthropic,
+            base_url: Some("http://localhost:11434".into()),
+            model_id: "llama3".into(),
+            auth: AuthRef::None,
        };
+        // scheme.required_auth() が XApiKey でも ResolvedAuth::None は許容する
+        // （None は全 scheme で受け入れるため）
        assert!(build_client(&config).is_ok());
    }
 }
--- a/tickets/llm-model-config.md
+++ b/tickets/llm-model-config.md
@ -1,5 +1,9 @@
 # LLM モデル設定の再編

+> **レビュー中** — 詳細は [`llm-model-config.review.md`](llm-model-config.review.md)
+> 主な指摘: 要件 6 の `ModelConfig.capability` override 未実装、`validate_config` の機能退化（OpenAI top_k warning 消失）。どちらも判断待ち。
+
+
 ## 背景

 決定済みの LLM プロバイダサポート方針（`docs/plan/llm_providers.md`）に従って llm-worker のプロバイダ層を再編する。Pod 側で「使う LLM モデル」を宣言する構造にし、共通の通信層 + scheme の組合せで任意のプロバイダを収容できるようにする。
--- a/tickets/llm-model-config.review.md
+++ b/tickets/llm-model-config.review.md
@ -0,0 +1,105 @@
+# LLM モデル設定の再編 — レビュー
+
+## 前提・要件の再確認
+
+`docs/plan/llm_providers.md` の第一級/二次/非サポート方針と、チケット本体の 9 要件 + 6 設計決定 を前提に、実装が意図と整合しているかを確認した。変更量は +1608 / -1174 行、41 ファイル。
+
+`cargo check` および `cargo test --workspace --lib` は通過。
+
+## 要件達成度
+
+| # | 要件 | 状況 | メモ |
+|---|---|---|---|
+| 1 | Pod マニフェスト `[model]` 宣言 | ✓ | `manifest/src/model.rs` + `config.rs::ModelConfigPartial` |
+| 2 | `providers/` 層廃止 | ✓ | 4 ファイル削除、`HttpTransport<S>` 1 本に集約 |
+| 3 | 既存 scheme 再編（openai → openai_chat、Ollama は流用） | ✓ | 各 scheme に `scheme_impl.rs` + `capability.rs` 追加 |
+| 4 | `AuthRef` 分離 | ✓ | `manifest/model.rs` + `llm_client/auth.rs::AuthRequirement` |
+| 5 | 第一級/二次 方針整合 | ✓ | `provider/lib.rs::build_client` + `SchemeKind` |
+| 6 | `ModelCapability` 分離 | △ | 型定義・静的テーブル・default はあり。**`ModelConfig` からのマニフェスト override は未実装** |
+| 7 | Streaming 現状維持 | ✓ | Event 型変更なし、`Scheme::State` で Anthropic block_type 補完 |
+| 8 | Ollama 運用注意点 | ✓ | `default_capability` で Anthropic scheme が `CacheStrategy::Auto`、`ollama_succeeds_without_key` テストあり |
+| 9 | 完了時動作 | ✓ | ビルド通過、既存テスト通過 |
+
+## 設計決定の反映
+
+| # | 決定 | 反映 |
+|---|---|---|
+| 1 | `Scheme` trait 方針A（全面抽象化） | ✓ `scheme/mod.rs::Scheme` に URL/認証/ヘッダ/body/SSE を集約。`State` associated type で Anthropic の `block_type` 補完を綺麗に処理 |
+| 2 | `AuthRef` 組合せ検証 方針B（構築時） | ✓ `ResolvedAuth::matches` + `build_transport` で照合 |
+| 3 | `crates/provider` 方針A（残す） | ✓ 薄いファクトリとして維持 |
+| 4 | `ModelCapability` ハイブリッド | △ scheme 側静的テーブルはあるが、マニフェスト override 側が欠落 |
+| 5 | フィールド単位 override | ✓ `ModelConfigPartial::merge` |
+| 6 | TOML 後方互換切り | ✓ 旧 `[provider]` は完全に新 `[model]` に置換 |
+
+## 指摘事項
+
+### 優先度: 中
+
+#### 1. 要件 6 の「ModelConfig で明示宣言すれば override」が未実装
+
+`ModelConfig` 構造体に `capability: Option<ModelCapability>` フィールドがない。設計決定 4（ハイブリッド: scheme 側テーブル → マニフェスト override → デフォルト）の **override 側が欠落**している。
+
+影響:
+- scheme 静的テーブルに無いモデル（OpenRouter / xAI の Grok / Groq の Kimi / OpenAI 互換ルーター系）は必ず `default_capability(scheme)` に落ちる
+- 二次サポートの共通枠の実用性に直結（例: Grok の `ReasoningSupport::Effort` が効かず reasoning 送れない）
+
+対応案:
+- A. 今チケットで `ModelConfig.capability: Option<ModelCapability>` を追加し `build_transport` で優先順位 `config.capability → scheme.capability_for → default_capability` に
+- B. Scope 外として明示し別チケットに切り出す
+
+ユーザーの決定方針（二次サポートを共通枠でカバー）からすると A が自然。ticket 本体の Scope 外にも記載がないため、A を推奨。
+
+#### 2. `validate_config` の機能退化
+
+旧 `providers/openai.rs` の `OpenAIClient` は `LlmClient::validate_config` をオーバーライドし「OpenAI は `top_k` 非対応」の warning を出していた。削除された `tests/validation_test.rs` はこの warning をテストしていた。
+
+今の `HttpTransport<S: Scheme>` は `validate_config` をオーバーライドしておらず、`LlmClient` trait のデフォルト実装（空 `Vec`）が使われる。つまり **`Worker::validate()` は scheme による制約（top_k, logprobs 等）を検出できなくなっている**。
+
+対応案:
+- `Scheme` trait に `validate_config(&RequestConfig) -> Vec<ConfigWarning>` を追加し、`HttpTransport` 側で scheme に委譲
+- 最低限 OpenAI Chat scheme で旧と同じ top_k warning を再実装
+- 合わせて新形式での regression test を追加（旧 `validation_test.rs` の代替）
+
+### 優先度: 低
+
+#### 3. `default_capability` の配置
+
+`crates/provider/lib.rs::default_capability` が `SchemeKind` ごとに直書き（同じ情報が `Scheme` trait 実装側と分離して存在）。`Scheme::default_capability()` メソッドに移動する方が関心事が集約される。今の形でも動作するが、新 scheme 追加時に 2 箇所編集が必要な点が弱い。
+
+#### 4. `AuthRequirement` 判定の緩さ
+
+`ResolvedAuth::matches` は `(None, _) => true` で常にパス。これは Ollama Anthropic 流用（`AuthRef::None` で `XApiKey` 要求）のための意図的設計だが、本来認証必須の scheme（Anthropic 本家）に誤って `AuthRef::None` を渡しても構築成功し、実行時の 401 で初めて失敗する。
+
+より厳密にするなら `AuthRequirement::XApiKeyOptional` のようなバリアント導入で分離できるが、実害は小さいので現状維持も許容範囲。
+
+#### 5. rustdoc のクロス crate リンク
+
+`scheme/mod.rs:47` の `[AuthRef](../../../manifest/enum.AuthRef.html)` は相対リンクで、`cargo doc --workspace` 時に切れる可能性。`[`manifest::AuthRef`]` 形式のクロス crate リンクにしておくと rustdoc が解決できる。
+
+## アーキテクチャ評価
+
+### 良い点
+- `Scheme::State` associated type の導入で「Anthropic の `content_block_stop` に `block_type` が載らない」といった具体的な痛みを抽象内で解決
+- `ResolvedAuth::matches` による構築時検証が `build_transport` 1 箇所に集約、分岐が明瞭
+- `ModelConfigPartial::merge` のフィールド単位 override が既存の cascade layer と自然に噛み合う
+- Ollama 運用の制約（`cache_control`/`tool_choice`/`metadata` 不可）が capability + scheme 側送出制御で分散、`provider::tests::ollama_succeeds_without_key` で境界条件がテストされている
+- `spawn_pod.rs::overlay_inherits_spawner_model` テストで親 Pod の `ModelConfig` が子にシームレスに伝播することを確認
+
+### コードベースを歪めていないか
+- 旧 `providers/` の 4 ファイルは綺麗に削除、重複は残っていない
+- `SchemeKind::OpenaiResponses` はマニフェスト側に先行存在するが、`build_client` で `SchemeNotImplemented` エラーを明示的に返す（別チケットで肉付け前提）。これは依存チケット設計通り
+- `AuthRef::CodexOAuth` も同様に予約のみ、`resolve_auth` でエラーを返す
+
+### 不必要な実装
+- `AuthRequirement::Custom` バリアントは Codex OAuth 用の先行予約で、今チケットでは使われない。将来の拡張点として小さい負債、許容範囲
+
+## 総合判定
+
+**コア要件は達成されている。構造再編は綺麗で、Scope の切り方も妥当**。実装ミス的な重大欠陥はなく、既存テストも全て通過している。
+
+ただし以下 2 点の判断が必要:
+
+1. **要件 6 の `ModelConfig.capability` override**: 今チケットで追加するか、Scope 外として明示するか
+2. **`validate_config` の退化**: 復活させるか、ticket 本体に「OpenAI の top_k warning 等の validate 機能は scheme 再編で意図的に落とした」旨を明記するか
+
+どちらも「今 close して後で別チケット」でも進められるが、最低限ticket 本体への記載（Scope 外明示 or 後続タスク言及）が必要。