From e975c838bea53b03fbd9d5e20fb9c9d09512bfbf Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Fri, 16 Jan 2026 11:45:59 -0500 Subject: [PATCH 1/5] add universla param configs --- .../cross-transformation-coverage.yml | 8 +- Cargo.lock | 1 + Makefile | 1 + crates/braintrust-llm-router/src/error.rs | 93 +- crates/braintrust-llm-router/src/router.rs | 7 +- crates/braintrust-llm-router/src/streaming.rs | 2 +- crates/coverage-report/Cargo.toml | 5 + crates/coverage-report/README.md | 259 ++++ crates/coverage-report/src/compact.rs | 395 ++++++ crates/coverage-report/src/discovery.rs | 14 +- crates/coverage-report/src/expected.rs | 444 ++++++ crates/coverage-report/src/lib.rs | 29 + crates/coverage-report/src/main.rs | 217 ++- crates/coverage-report/src/normalizers.rs | 95 ++ crates/coverage-report/src/report.rs | 699 +++++---- .../src/requests_expected_differences.json | 255 ++++ .../src/responses_expected_differences.json | 108 ++ crates/coverage-report/src/runner.rs | 1055 ++++++++------ .../src/streaming_expected_differences.json | 62 + crates/coverage-report/src/types.rs | 264 +++- .../tests/cross_provider_test.rs | 62 + crates/generate-types/src/main.rs | 19 +- crates/lingua/src/error.rs | 16 +- crates/lingua/src/processing/adapters.rs | 58 +- crates/lingua/src/processing/import.rs | 11 +- crates/lingua/src/processing/transform.rs | 25 + .../lingua/src/providers/anthropic/adapter.rs | 566 ++++++-- .../lingua/src/providers/anthropic/convert.rs | 529 +++---- .../src/providers/anthropic/generated.rs | 13 + crates/lingua/src/providers/anthropic/mod.rs | 1 + .../lingua/src/providers/anthropic/params.rs | 157 +++ .../lingua/src/providers/bedrock/adapter.rs | 445 ++++-- crates/lingua/src/providers/bedrock/mod.rs | 1 + crates/lingua/src/providers/bedrock/params.rs | 107 ++ crates/lingua/src/providers/google/adapter.rs | 639 ++++----- crates/lingua/src/providers/google/mod.rs | 1 + crates/lingua/src/providers/google/params.rs | 97 ++ crates/lingua/src/providers/openai/adapter.rs | 1245 ++++++----------- crates/lingua/src/providers/openai/convert.rs | 732 ++++++++-- crates/lingua/src/providers/openai/mod.rs | 11 +- crates/lingua/src/providers/openai/params.rs | 198 +++ .../src/providers/openai/responses_adapter.rs | 848 +++++++++++ .../providers/openai/test_chat_completions.rs | 56 +- crates/lingua/src/python.rs | 5 +- crates/lingua/src/universal/mod.rs | 14 +- crates/lingua/src/universal/reasoning.rs | 527 +++++++ crates/lingua/src/universal/request.rs | 577 +++++++- crates/lingua/src/universal/response.rs | 298 +++- .../lingua/src/universal/response_format.rs | 429 ++++++ crates/lingua/src/universal/tool_choice.rs | 447 ++++++ crates/lingua/src/universal/tools.rs | 873 ++++++++++++ crates/lingua/src/wasm.rs | 5 +- payloads/scripts/providers/openai.ts | 2 + payloads/scripts/validate.ts | 1 + payloads/scripts/validation/index.ts | 65 +- payloads/scripts/validation/reporter.ts | 15 +- 56 files changed, 10411 insertions(+), 2697 deletions(-) create mode 100644 crates/coverage-report/README.md create mode 100644 crates/coverage-report/src/compact.rs create mode 100644 crates/coverage-report/src/expected.rs create mode 100644 crates/coverage-report/src/lib.rs create mode 100644 crates/coverage-report/src/normalizers.rs create mode 100644 crates/coverage-report/src/requests_expected_differences.json create mode 100644 crates/coverage-report/src/responses_expected_differences.json create mode 100644 crates/coverage-report/src/streaming_expected_differences.json create mode 100644 
crates/coverage-report/tests/cross_provider_test.rs create mode 100644 crates/lingua/src/providers/anthropic/params.rs create mode 100644 crates/lingua/src/providers/bedrock/params.rs create mode 100644 crates/lingua/src/providers/google/params.rs create mode 100644 crates/lingua/src/providers/openai/params.rs create mode 100644 crates/lingua/src/providers/openai/responses_adapter.rs create mode 100644 crates/lingua/src/universal/reasoning.rs create mode 100644 crates/lingua/src/universal/response_format.rs create mode 100644 crates/lingua/src/universal/tool_choice.rs create mode 100644 crates/lingua/src/universal/tools.rs diff --git a/.github/workflows/cross-transformation-coverage.yml b/.github/workflows/cross-transformation-coverage.yml index 0a0eb7ce..0acb96ac 100644 --- a/.github/workflows/cross-transformation-coverage.yml +++ b/.github/workflows/cross-transformation-coverage.yml @@ -45,18 +45,22 @@ jobs: - name: Generate coverage report run: | cargo run -p coverage-report > coverage_report.md - # This job is informational only - it always succeeds - # Click into the job summary to see the actual coverage report - name: Post coverage to job summary + if: always() run: | echo "# 🔄 Cross-Provider Transformation Coverage" >> $GITHUB_STEP_SUMMARY echo "" >> $GITHUB_STEP_SUMMARY cat coverage_report.md >> $GITHUB_STEP_SUMMARY - name: Upload coverage artifact + if: always() uses: actions/upload-artifact@v4 with: name: transformation-coverage-report path: coverage_report.md retention-days: 30 + + - name: Verify no unexpected failures + run: | + cargo test -p coverage-report --test cross_provider_test -- --nocapture diff --git a/Cargo.lock b/Cargo.lock index e47c6adc..b3d1f4d3 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -860,6 +860,7 @@ dependencies = [ "big_serde_json", "bytes", "lingua", + "regex", "serde", ] diff --git a/Makefile b/Makefile index aef94b35..d7ff8712 100644 --- a/Makefile +++ b/Makefile @@ -55,6 +55,7 @@ test-typescript-integration: typescript ## Run TypeScript integration tests test-python: ## Run Python tests @echo "Running Python tests..." + cd bindings/python && uv run maturin develop --features python cd bindings/python && uv run pytest tests/ -v clean: ## Clean build artifacts diff --git a/crates/braintrust-llm-router/src/error.rs b/crates/braintrust-llm-router/src/error.rs index ea42487b..bd6e6495 100644 --- a/crates/braintrust-llm-router/src/error.rs +++ b/crates/braintrust-llm-router/src/error.rs @@ -84,8 +84,8 @@ pub enum Error { #[error("invalid request: {0}")] InvalidRequest(String), - #[error("lingua conversion failed: {0}")] - Lingua(String), + #[error("{0}")] + Lingua(#[from] lingua::TransformError), #[error("authentication error: {0}")] Auth(String), @@ -107,6 +107,32 @@ impl Error { _ => None, } } + + /// Returns true if this is a client-side error (400 Bad Request). + /// + /// Client errors indicate problems with the user's request that they + /// should fix, such as unknown models, unsupported formats, or invalid payloads. + pub fn is_client_error(&self) -> bool { + matches!( + self, + Error::UnknownModel(_) | Error::NoProvider(_) | Error::InvalidRequest(_) + ) || matches!(self, Error::Lingua(e) if e.is_client_error()) + } + + /// Returns true if this is an authentication error (401 Unauthorized). + /// + /// Auth errors indicate missing or invalid authentication credentials. + pub fn is_auth_error(&self) -> bool { + matches!(self, Error::NoAuth(_) | Error::Auth(_)) + } + + /// Returns true if this is an upstream provider error with HTTP details. 
+ /// + /// Upstream errors should be passed through to the client with the original + /// status code, headers, and body from the provider. + pub fn is_upstream_error(&self) -> bool { + matches!(self, Error::Provider { http: Some(_), .. }) + } } #[cfg(test)] @@ -128,4 +154,67 @@ mod tests { assert_eq!(body, "not found"); assert_eq!(returned_headers, vec![("x-test".into(), "value".into())]); } + + #[test] + fn transform_error_classification() { + use lingua::TransformError; + + // Client errors + assert!(TransformError::UnableToDetectFormat.is_client_error()); + assert!(TransformError::ValidationFailed { + target: ProviderFormat::OpenAI, + reason: "test".into() + } + .is_client_error()); + assert!(TransformError::DeserializationFailed("invalid json".into()).is_client_error()); + assert!(TransformError::UnsupportedTargetFormat(ProviderFormat::OpenAI).is_client_error()); + assert!(TransformError::UnsupportedSourceFormat(ProviderFormat::OpenAI).is_client_error()); + + // Server errors + assert!(!TransformError::SerializationFailed("test".into()).is_client_error()); + assert!(!TransformError::FromUniversalFailed("test".into()).is_client_error()); + assert!(!TransformError::ToUniversalFailed("test".into()).is_client_error()); + assert!(!TransformError::StreamingNotImplemented("test".into()).is_client_error()); + } + + #[test] + fn router_error_classification() { + // Client errors + assert!(Error::UnknownModel("gpt-5".into()).is_client_error()); + assert!(Error::NoProvider(ProviderFormat::OpenAI).is_client_error()); + assert!(Error::InvalidRequest("bad".into()).is_client_error()); + assert!(Error::Lingua(lingua::TransformError::UnableToDetectFormat).is_client_error()); + + // Auth errors + assert!(Error::NoAuth("openai".into()).is_auth_error()); + assert!(Error::Auth("invalid".into()).is_auth_error()); + + // Not client errors + assert!(!Error::Timeout.is_client_error()); + assert!( + !Error::Lingua(lingua::TransformError::SerializationFailed("test".into())) + .is_client_error() + ); + + // Upstream errors + let upstream_err = Error::Provider { + provider: "openai".into(), + source: anyhow::anyhow!("test"), + retry_after: None, + http: Some(UpstreamHttpError { + status: 404, + headers: vec![], + body: "not found".into(), + }), + }; + assert!(upstream_err.is_upstream_error()); + + let non_upstream_err = Error::Provider { + provider: "openai".into(), + source: anyhow::anyhow!("test"), + retry_after: None, + http: None, + }; + assert!(!non_upstream_err.is_upstream_error()); + } } diff --git a/crates/braintrust-llm-router/src/router.rs b/crates/braintrust-llm-router/src/router.rs index f3a4b9e5..5fca83ea 100644 --- a/crates/braintrust-llm-router/src/router.rs +++ b/crates/braintrust-llm-router/src/router.rs @@ -154,7 +154,7 @@ impl Router { Ok(TransformResult::PassThrough(bytes)) => bytes, Ok(TransformResult::Transformed { bytes, .. }) => bytes, Err(TransformError::UnsupportedTargetFormat(_)) => body.clone(), - Err(e) => return Err(Error::Lingua(e.to_string())), + Err(e) => return Err(e.into()), }; let response_bytes = self @@ -168,8 +168,7 @@ impl Router { ) .await?; - let result = lingua::transform_response(response_bytes.clone(), output_format) - .map_err(|e| Error::Lingua(e.to_string()))?; + let result = lingua::transform_response(response_bytes.clone(), output_format)?; let response = match result { TransformResult::PassThrough(bytes) => bytes, @@ -211,7 +210,7 @@ impl Router { Ok(TransformResult::PassThrough(bytes)) => bytes, Ok(TransformResult::Transformed { bytes, .. 
}) => bytes, Err(TransformError::UnsupportedTargetFormat(_)) => body.clone(), - Err(e) => return Err(Error::Lingua(e.to_string())), + Err(e) => return Err(e.into()), }; let raw_stream = provider diff --git a/crates/braintrust-llm-router/src/streaming.rs b/crates/braintrust-llm-router/src/streaming.rs index c49f2f8a..848654f0 100644 --- a/crates/braintrust-llm-router/src/streaming.rs +++ b/crates/braintrust-llm-router/src/streaming.rs @@ -59,7 +59,7 @@ pub fn transform_stream(raw: RawResponseStream, output_format: ProviderFormat) - // Pass through unrecognized formats Some(Ok(bytes)) } - Err(e) => Some(Err(Error::Lingua(e.to_string()))), + Err(e) => Some(Err(Error::Lingua(e))), } } Err(e) => Some(Err(e)), diff --git a/crates/coverage-report/Cargo.toml b/crates/coverage-report/Cargo.toml index 56693d10..5e78e03a 100644 --- a/crates/coverage-report/Cargo.toml +++ b/crates/coverage-report/Cargo.toml @@ -5,6 +5,10 @@ edition.workspace = true publish = false description = "Cross-provider transformation coverage report generator for Lingua" +[lib] +name = "coverage_report" +path = "src/lib.rs" + [[bin]] name = "coverage-report" path = "src/main.rs" @@ -14,3 +18,4 @@ lingua = { path = "../lingua", features = ["openai", "anthropic", "google", "bed serde.workspace = true big_serde_json.workspace = true bytes.workspace = true +regex = "1" diff --git a/crates/coverage-report/README.md b/crates/coverage-report/README.md new file mode 100644 index 00000000..020b9dd1 --- /dev/null +++ b/crates/coverage-report/README.md @@ -0,0 +1,259 @@ +# Coverage Report + +Cross-provider transformation coverage report generator for Lingua. + +## Overview + +This tool runs transformation tests between all provider formats (OpenAI, Anthropic, Google, Bedrock, Responses) and generates a markdown report showing which transformations succeed, fail, or have known limitations. + +## What it tests + +1. **Request transformations**: Source provider request → Target provider request +2. **Response transformations**: Source provider response → Target provider response +3. **Streaming transformations**: Source streaming events → Target streaming events +4. **Roundtrip tests**: Provider → Universal → Provider (same provider) + +## Architecture and difference handling + +### Design philosophy + +The coverage report tool follows a clean architecture where **runner.rs is mechanically pure**: + +- ✅ **Compares values objectively** - no special cases or equivalence decisions +- ✅ **Reports differences accurately** - doesn't hide or transform failures +- ✅ **Queries configuration** - delegates policy decisions to config files + +### Where difference handling lives + +All policy decisions about acceptable differences belong in one of two places: + +1. **Adapter code** (`lingua/src/providers/*/adapter.rs`) + - Transformation logic (how to convert between formats) + - Provider-specific defaults and normalization + - Example: Google/Bedrock model injection (required by those APIs) + +2. 
**Expected differences configuration** (JSON files in `src/`) + - `requests_expected_differences.json` - Request transformation limitations + - `responses_expected_differences.json` - Response transformation limitations + - `streaming_expected_differences.json` - Streaming transformation limitations + +### Configuration structure + +**Expected differences files** document known provider limitations using a two-tier structure: + +```json +{ + "global": [ + { + "source": "*", + "target": "Anthropic", + "fields": [ + { "pattern": "params.top_k", "reason": "OpenAI doesn't support top_k" } + ], + "errors": [ + { "pattern": "does not support logprobs", "reason": "Anthropic lacks logprobs" } + ] + } + ], + "perTestCase": [ + { + "testCase": "imageContentParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic assistant messages don't support image content" + } + ] +} +``` + +**Global rules** apply to all test cases for a source→target pair. **Per-test-case rules** apply only to specific tests. + +## Provider-specific metadata handling + +Certain fields are intentionally lost during cross-provider transformations because they represent provider-specific metadata with no universal equivalent. These are marked as "limitations" in the coverage report: + +### Fields that don't translate across providers + +**Message/Response IDs** (`id`, `messages[*].id`): +- Each provider uses different ID schemes that represent different concepts: + - **OpenAI Chat Completions**: Response-level `id` (e.g., `chatcmpl-ABC123`) + - **OpenAI Responses API**: Response-level `id` (e.g., `resp-XYZ789`) + - **Anthropic**: Message-level `id` (e.g., `msg_01AbCdEfG`) + - **Bedrock**: No IDs at all +- These IDs cannot be meaningfully translated across providers + +**Timestamps** (`created`, `created_at`): +- Provider-specific generation timestamps with inconsistent field names: + - **OpenAI Chat**: Uses `created` (Unix timestamp) + - **OpenAI Responses**: Uses `created_at` (Unix timestamp) + - **Anthropic/Bedrock**: Don't include timestamps +- Represents when the response was generated, not part of actual content + +**Service tier** (`service_tier`): +- OpenAI-specific billing tier indicating account level (`"default"` or `"scale"`) +- Not present in other providers (Anthropic has different usage tracking structure) +- This is API billing metadata, not universal content + +**System fingerprint** (`system_fingerprint`): +- OpenAI-specific system identifier for tracking backend changes +- Not present in other providers + +The Universal format is intentionally provider-agnostic and doesn't preserve these provider-specific metadata fields during cross-provider transformations. + +### How test results are classified + +Each test produces one of four outcomes: + +1. **Pass** ✅ - Transformation succeeded with no differences +2. **Fail** ❌ - Transformation failed or produced unexpected differences +3. **Limitation** ⚠️ - Differences match documented provider limitations +4. **Skipped** ⊘ - Test case doesn't exist for this provider + +The runner mechanically compares values. The expected differences configuration determines which failures are "expected limitations" vs real bugs. 
+ +## Usage + +```bash +# Run all tests (default) +cargo run --bin coverage-report + +# Filter by coverage type +cargo run --bin coverage-report -- --coverage requests +cargo run --bin coverage-report -- --coverage requests,responses +cargo run --bin coverage-report -- --coverage roundtrip + +# Filter by test case name +cargo run --bin coverage-report -- --test-cases seedParam +cargo run --bin coverage-report -- -t seedParam,toolCallRequest + +# Filter with glob patterns +cargo run --bin coverage-report -- -t "reasoning*" # All reasoning tests +cargo run --bin coverage-report -- -t "*Param" # All param tests +cargo run --bin coverage-report -- -t "tool*" # All tool tests + +# Filter by provider +cargo run --bin coverage-report -- --providers responses,anthropic +cargo run --bin coverage-report -- -p anthropic,google + +# Filter by source/target direction +cargo run --bin coverage-report -- --source responses --target anthropic +cargo run --bin coverage-report -- --source anthropic + +# Combine filters +cargo run --bin coverage-report -- \ + -t seedParam \ + -p responses,anthropic \ + --coverage requests + +# Token-optimized compact output (~95% smaller) +cargo run --bin coverage-report -- --format compact +cargo run --bin coverage-report -- -f c +``` + +## Options + +| Option | Short | Description | +|--------|-------|-------------| +| `--coverage` | | Coverage types: `requests`, `responses`, `streaming`, `roundtrip`, `all` | +| `--test-cases` | `-t` | Test case patterns (supports glob: `*` any chars, `?` single char) | +| `--providers` | `-p` | Provider filter (both source AND target must match) | +| `--source` | | Filter source providers only | +| `--target` | | Filter target providers only | +| `--format` | `-f` | Output format: `markdown` (default), `compact` | + +## Provider names + +| Name | Aliases | +|------|---------| +| `responses` | `response`, `openai-responses` | +| `openai` | `chat-completions`, `chatcompletions`, `completions` | +| `anthropic` | | +| `google` | `gemini` | +| `bedrock` | `converse` | + +## Test cases + +Test cases are discovered from `payloads/snapshots/`. Each test case directory contains provider-specific request/response JSON files: + +``` +payloads/snapshots/ +├── seedParam/ +│ ├── anthropic/ +│ │ ├── request.json +│ │ ├── response.json +│ │ └── response-streaming.json +│ ├── responses/ +│ ├── chat-completions/ +│ ├── google/ +│ └── bedrock/ +├── toolCallRequest/ +├── reasoningRequest/ +└── ... 
+``` + +## Output formats + +### Markdown (default) + +The default format outputs detailed markdown with: + +- Summary statistics (pass/fail/limitation counts) +- Cross-provider transformation matrix +- Roundtrip test results per provider +- Detailed failure information with diffs +- Collapsible sections for easy navigation + +### Compact (token-optimized) + +The compact format (`-f compact`) produces ~95% smaller output optimized for LLM consumption: + +``` +# Coverage (compact) +Stats: 669/1704 (39.3%) [512+157lim] 1035fail +req:617/836 res:32/424 str:20/444 + +## Failures (79 patterns, 1035 total) + +[P1] L:usage.prompt_cache_creation_tokens (123) + ant→ggl: cacheControl1hParam (response)...(+44) + ant→oai: cacheControl5mParam (response)...(+41) +``` + +Key optimizations: +- **Provider abbreviations**: `oai`, `ant`, `ggl`, `bed`, `rsp` +- **Error deduplication**: Groups failures by pattern with counts +- **Test case compression**: `seedParam...(+27)` instead of listing all 28 +- **No HTML/markdown overhead**: Plain text with minimal structure + +## Examples + +### Quick check on a specific test case + +```bash +cargo run --bin coverage-report -- -t seedParam --coverage requests +``` + +### Test Responses→Anthropic transformations + +```bash +cargo run --bin coverage-report -- --source responses --target anthropic +``` + +### Test all reasoning-related features + +```bash +cargo run --bin coverage-report -- -t "reasoning*" +``` + +### Full coverage report (CI) + +```bash +cargo run --bin coverage-report > coverage.md +``` + +### Token-optimized report for LLM analysis + +```bash +cargo run --bin coverage-report -- -f compact > coverage.txt +``` diff --git a/crates/coverage-report/src/compact.rs b/crates/coverage-report/src/compact.rs new file mode 100644 index 00000000..77e11a17 --- /dev/null +++ b/crates/coverage-report/src/compact.rs @@ -0,0 +1,395 @@ +/*! +Compact (token-optimized) report generation. + +This module generates a condensed report format that minimizes token usage by: +- Using provider abbreviations (oai, ant, ggl, bed, rsp) +- Deduplicating errors by pattern and showing counts +- Removing HTML/markdown formatting overhead +- Using flat structure instead of nested sections +*/ + +use std::collections::HashMap; + +use lingua::processing::adapters::ProviderAdapter; + +use crate::types::{FailureWithDiff, PairResult, RoundtripDiff, TableStats}; + +/// Abbreviate provider name for compact output. +pub fn abbrev(name: &str) -> &'static str { + match name { + "Responses" => "rsp", + "ChatCompletions" => "oai", + "Anthropic" => "ant", + "Google" => "ggl", + "Bedrock" => "bed", + _ => "???", + } +} + +/// Error pattern for deduplication. +#[derive(Debug, Clone, Hash, Eq, PartialEq)] +pub struct ErrorPattern { + pub pattern: String, + pub category: char, +} + +/// Group of test cases with the same error pattern. +#[derive(Debug)] +pub struct PatternGroup { + pub pattern: ErrorPattern, + pub by_direction: HashMap>, + pub total_count: usize, +} + +/// Truncate a string to a maximum number of characters, adding "..." if truncated. +/// Uses character count, not byte count, to avoid UTF-8 panics. +fn truncate_str(s: &str, max_chars: usize) -> String { + let char_count = s.chars().count(); + if char_count > max_chars { + let truncated: String = s.chars().take(max_chars.saturating_sub(3)).collect(); + format!("{}...", truncated) + } else { + s.to_string() + } +} + +/// Normalize field path for grouping (collapse array indices, truncate long paths). 
+fn normalize_field_path(path: &str) -> String { + // Replace array indices with [*] + let mut result = String::new(); + let mut chars = path.chars().peekable(); + + while let Some(c) = chars.next() { + if c == '[' { + result.push('['); + // Skip digits until ] + let mut is_numeric = true; + let mut inner = String::new(); + while let Some(&next) = chars.peek() { + if next == ']' { + break; + } + inner.push(chars.next().unwrap()); + if !inner.chars().last().unwrap().is_ascii_digit() { + is_numeric = false; + } + } + if is_numeric && !inner.is_empty() { + result.push('*'); + } else { + result.push_str(&inner); + } + } else { + result.push(c); + } + } + + // Truncate very long paths (character-safe) + truncate_str(&result, 40) +} + +/// Normalize field list for pattern matching. +fn normalize_field_list(fields: &[String]) -> String { + if fields.len() <= 3 { + fields + .iter() + .map(|f| normalize_field_path(f)) + .collect::<Vec<_>>() + .join(",") + } else { + let first_two: Vec<_> = fields + .iter() + .take(2) + .map(|f| normalize_field_path(f)) + .collect(); + format!("{}...(+{})", first_two.join(","), fields.len() - 2) + } +} + +/// Normalize error message for pattern grouping. +fn normalize_error_message(error: &str) -> String { + truncate_str(error, 60) +} + +/// Extract error pattern from a failure. +pub fn extract_pattern(error: &str, diff: &Option<RoundtripDiff>) -> ErrorPattern { + if let Some(d) = diff { + if !d.lost_fields.is_empty() { + let fields = normalize_field_list(&d.lost_fields); + return ErrorPattern { + pattern: format!("L:{}", fields), + category: 'L', + }; + } + if !d.added_fields.is_empty() { + let fields = normalize_field_list(&d.added_fields); + return ErrorPattern { + pattern: format!("A:{}", fields), + category: 'A', + }; + } + if !d.changed_fields.is_empty() { + let fields: Vec<_> = d + .changed_fields + .iter() + .map(|(path, _, _)| normalize_field_path(path)) + .collect(); + let fields_str = if fields.len() <= 3 { + fields.join(",") + } else { + format!("{}...(+{})", fields[..2].join(","), fields.len() - 2) + }; + return ErrorPattern { + pattern: format!("C:{}", fields_str), + category: 'C', + }; + } + } + + let normalized = normalize_error_message(error); + ErrorPattern { + pattern: normalized, + category: 'E', + } +} + +/// Compact test case names using glob patterns where possible. +fn compact_test_names(names: &[String]) -> String { + if names.len() <= 2 { + return names.join(","); + } + format!("{}...(+{})", names[0], names.len() - 1) +} + +/// Group failures by error pattern. +pub fn group_failures(failures: &[FailureWithDiff]) -> Vec<PatternGroup> { + let mut groups: HashMap<ErrorPattern, PatternGroup> = HashMap::new(); + + for (direction, test_case, error, diff) in failures { + let pattern = extract_pattern(error, diff); + + let group = groups + .entry(pattern.clone()) + .or_insert_with(|| PatternGroup { + pattern, + by_direction: HashMap::new(), + total_count: 0, + }); + + group + .by_direction + .entry(direction.clone()) + .or_default() + .push(test_case.clone()); + group.total_count += 1; + } + + // Sort by count descending + let mut groups: Vec<_> = groups.into_values().collect(); + groups.sort_by(|a, b| b.total_count.cmp(&a.total_count)); + groups +} + +/// Generate compact report header with stats.
+pub fn generate_compact_header( + req_stats: &TableStats, + resp_stats: &TableStats, + stream_stats: &TableStats, +) -> String { + let mut output = String::new(); + output.push_str("# Coverage (compact)\n"); + + let total_passed = req_stats.passed + resp_stats.passed + stream_stats.passed; + let total_failed = req_stats.failed + resp_stats.failed + stream_stats.failed; + let total_lim = req_stats.limitations + resp_stats.limitations + stream_stats.limitations; + let total_working = total_passed + total_lim; + let total = total_working + total_failed; + let pct = if total > 0 { + (total_working as f64 / total as f64) * 100.0 + } else { + 0.0 + }; + + output.push_str(&format!( + "Stats: {}/{} ({:.1}%) [{}+{}lim] {}fail\n", + total_working, total, pct, total_passed, total_lim, total_failed + )); + + // Per-type stats on one line + let req_total = req_stats.passed + req_stats.failed + req_stats.limitations; + let resp_total = resp_stats.passed + resp_stats.failed + resp_stats.limitations; + let str_total = stream_stats.passed + stream_stats.failed + stream_stats.limitations; + + let mut type_stats = Vec::new(); + if req_total > 0 { + type_stats.push(format!( + "req:{}/{}", + req_stats.passed + req_stats.limitations, + req_total + )); + } + if resp_total > 0 { + type_stats.push(format!( + "res:{}/{}", + resp_stats.passed + resp_stats.limitations, + resp_total + )); + } + if str_total > 0 { + type_stats.push(format!( + "str:{}/{}", + stream_stats.passed + stream_stats.limitations, + str_total + )); + } + + if !type_stats.is_empty() { + output.push_str(&type_stats.join(" ")); + output.push('\n'); + } + + output +} + +/// Generate compact failures section. +pub fn generate_compact_failures(failures: &[FailureWithDiff]) -> String { + let mut output = String::new(); + + if failures.is_empty() { + return output; + } + + let groups = group_failures(failures); + + output.push_str(&format!( + "\n## Failures ({} patterns, {} total)\n", + groups.len(), + failures.len() + )); + + for (idx, group) in groups.iter().enumerate() { + output.push_str(&format!( + "\n[P{}] {} ({})\n", + idx + 1, + group.pattern.pattern, + group.total_count + )); + + // Sort directions by count descending + let mut directions: Vec<_> = group.by_direction.iter().collect(); + directions.sort_by(|a, b| b.1.len().cmp(&a.1.len())); + + for (direction, test_cases) in directions { + // Abbreviate direction + let parts: Vec<_> = direction.split(" → ").collect(); + let abbrev_dir = if parts.len() == 2 { + format!("{}→{}", abbrev(parts[0]), abbrev(parts[1])) + } else { + direction.clone() + }; + + let compact_names = compact_test_names(test_cases); + output.push_str(&format!(" {}: {}\n", abbrev_dir, compact_names)); + } + } + + output +} + +/// Generate compact limitations section. 
+pub fn generate_compact_limitations(limitations: &[(String, String, String)]) -> String { + let mut output = String::new(); + + if limitations.is_empty() { + return output; + } + + // Group by direction + let mut by_direction: HashMap<String, Vec<(String, String)>> = HashMap::new(); + for (direction, test_case, reason) in limitations { + by_direction + .entry(direction.clone()) + .or_default() + .push((test_case.clone(), reason.clone())); + } + + output.push_str(&format!("\n## Limitations ({})\n", limitations.len())); + + let mut directions: Vec<_> = by_direction.into_iter().collect(); + directions.sort_by(|a, b| b.1.len().cmp(&a.1.len())); + + for (direction, items) in directions { + let parts: Vec<_> = direction.split(" → ").collect(); + let abbrev_dir = if parts.len() == 2 { + format!("{}→{}", abbrev(parts[0]), abbrev(parts[1])) + } else { + direction.clone() + }; + output.push_str(&format!( + "{}: {}\n", + abbrev_dir, + compact_test_names(&items.iter().map(|(t, _)| t.clone()).collect::<Vec<_>>()) + )); + } + + output +} + +/// Collect statistics from results. +pub fn collect_stats(results: &HashMap<(usize, usize), PairResult>) -> TableStats { + let mut stats = TableStats { + passed: 0, + failed: 0, + limitations: 0, + }; + for pair_result in results.values() { + stats.passed += pair_result.passed; + stats.failed += pair_result.failed; + stats.limitations += pair_result.limitations; + } + stats +} + +/// Collect failures from results with direction info. +pub fn collect_failures( + results: &HashMap<(usize, usize), PairResult>, + adapters: &[Box<dyn ProviderAdapter>], +) -> Vec<FailureWithDiff> { + let mut failures = Vec::new(); + for ((source_idx, target_idx), pair_result) in results { + let direction = format!( + "{} → {}", + adapters[*source_idx].display_name(), + adapters[*target_idx].display_name() + ); + for (test_case, error, diff) in &pair_result.failures { + failures.push(( + direction.clone(), + test_case.clone(), + error.clone(), + diff.clone(), + )); + } + } + failures +} + +/// Collect limitations from results with direction info. +pub fn collect_limitations( + results: &HashMap<(usize, usize), PairResult>, + adapters: &[Box<dyn ProviderAdapter>], +) -> Vec<(String, String, String)> { + let mut limitations = Vec::new(); + for ((source_idx, target_idx), pair_result) in results { + let direction = format!( + "{} → {}", + adapters[*source_idx].display_name(), + adapters[*target_idx].display_name() + ); + for (test_case, reason, _diff) in &pair_result.limitation_details { + // Compact mode ignores diff - just pass through test_case and reason + limitations.push((direction.clone(), test_case.clone(), reason.clone())); + } + } + limitations +} diff --git a/crates/coverage-report/src/discovery.rs b/crates/coverage-report/src/discovery.rs index b7cfc009..2fa2d368 100644 --- a/crates/coverage-report/src/discovery.rs +++ b/crates/coverage-report/src/discovery.rs @@ -6,8 +6,18 @@ use bytes::Bytes; use std::fs; use std::path::PathBuf; -/// Discover all test case directories in payloads/snapshots -pub fn discover_test_cases() -> Vec<String> { +use crate::types::TestFilter; + +/// Discover test case directories in payloads/snapshots, filtered by the provided filter.
+pub fn discover_test_cases_filtered(filter: &TestFilter) -> Vec<String> { + discover_all_test_cases() + .into_iter() + .filter(|name| filter.matches_test_case(name)) + .collect() +} + +/// Discover all test case directories in payloads/snapshots (unfiltered) +fn discover_all_test_cases() -> Vec<String> { // Navigate from crates/coverage-report to workspace root let workspace_root = PathBuf::from(env!("CARGO_MANIFEST_DIR")) .parent() // crates/ diff --git a/crates/coverage-report/src/expected.rs b/crates/coverage-report/src/expected.rs new file mode 100644 index 00000000..8225ebbd --- /dev/null +++ b/crates/coverage-report/src/expected.rs @@ -0,0 +1,444 @@ +/*! +Expected differences whitelist. + +This module defines expected differences between providers that are NOT bugs, +but documented semantic differences due to provider limitations. + +This is the SINGLE SOURCE OF TRUTH for all expected limitations, covering: +- Test case skips (entire tests that cannot transform between providers) +- Field differences during comparison (params that don't exist in target provider) +- Transform errors (features that fail transformation with expected errors) + +# JSON files + +Expected differences are split by test category: +- `requests_expected_differences.json` - for request transformation tests +- `responses_expected_differences.json` - for response transformation tests +- `streaming_expected_differences.json` - for streaming response tests + +Each file uses a two-tier structure: + +```json +{ + "global": [ + { + "source": "*", + "target": "Anthropic", + "fields": [ + { "pattern": "params.top_k", "reason": "OpenAI doesn't support top_k" } + ], + "errors": [ + { "pattern": "does not support logprobs", "reason": "Anthropic doesn't support logprobs" } + ] + } + ], + "perTestCase": [ + { + "testCase": "imageContentParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic assistant messages don't support image content" + } + ] +} +``` + +## Structure + +- **global**: Rules that apply to ALL tests for a source→target pair +- **perTestCase**: Test-specific rules with explicit test case name + - Can have `skip: true` to skip entire test + - Can have `fields`/`errors` arrays for partial differences + +## Matching behavior + +- **Test case skip**: Exact match on testCase name +- **Fields**: Prefix matching (e.g., "params.response_format" matches "params.response_format.json_schema") +- **Errors**: Substring matching on error message + +## Provider matching + +`source` and `target` can be `"*"` to match any provider. This is useful for: +- Universal limitations (e.g., image media_type normalization) +- One-sided limitations (e.g., "any source → Anthropic" for frequency_penalty) +*/ + +use crate::types::ExpectedDifferences; +use std::sync::LazyLock; + +/// The category of test this expected difference applies to. +#[derive(Debug, Clone, Copy, PartialEq, Eq)] +pub enum TestCategory { + Requests, + Responses, + Streaming, +} + +/// Parse JSON content into ExpectedDifferences. +fn parse_expected_differences(json: &str, filename: &str) -> ExpectedDifferences { + big_serde_json::from_str(json).unwrap_or_else(|e| panic!("Failed to parse {}: {}", filename, e)) +} + +/// Expected differences for request transformations. +static EXPECTED_REQUESTS: LazyLock<ExpectedDifferences> = LazyLock::new(|| { + let json = include_str!("requests_expected_differences.json"); + parse_expected_differences(json, "requests_expected_differences.json") +}); + +/// Expected differences for response transformations.
+static EXPECTED_RESPONSES: LazyLock<ExpectedDifferences> = LazyLock::new(|| { + let json = include_str!("responses_expected_differences.json"); + parse_expected_differences(json, "responses_expected_differences.json") +}); + +/// Expected differences for streaming response transformations. +static EXPECTED_STREAMING: LazyLock<ExpectedDifferences> = LazyLock::new(|| { + let json = include_str!("streaming_expected_differences.json"); + parse_expected_differences(json, "streaming_expected_differences.json") +}); + +/// Get the expected differences for a given test category. +fn get_expected_differences(category: TestCategory) -> &'static ExpectedDifferences { + match category { + TestCategory::Requests => &EXPECTED_REQUESTS, + TestCategory::Responses => &EXPECTED_RESPONSES, + TestCategory::Streaming => &EXPECTED_STREAMING, + } +} + +/// Helper function for source/target matching with wildcard support. +fn matches_source_target(rule_source: &str, rule_target: &str, source: &str, target: &str) -> bool { + (rule_source == "*" || rule_source == source) && (rule_target == "*" || rule_target == target) +} + +/// Check if a test case is expected to be skipped for the given source→target. +/// +/// Returns the reason if expected to skip, None otherwise. +pub fn is_expected_test_case( + category: TestCategory, + source: &str, + target: &str, + test_case: &str, +) -> Option<String> { + let diffs = get_expected_differences(category); + + // Check per-test-case rules + for rule in &diffs.per_test_case { + if rule.test_case == test_case + && rule.skip + && matches_source_target(&rule.source, &rule.target, source, target) + { + return rule.reason.clone(); + } + } + + None +} + +/// Check if a field difference is expected for the given source→target translation. +/// +/// Returns the reason if the difference is expected, None if it's unexpected (a bug). +pub fn is_expected_field( + category: TestCategory, + source: &str, + target: &str, + test_case: Option<&str>, + field: &str, +) -> Option<String> { + let diffs = get_expected_differences(category); + + // Helper to check if a pattern matches (prefix matching with [*] wildcard) + // Example: pattern "choices[*].delta.refusal" matches field "choices[0].delta.refusal" + let pattern_matches = |pattern: &str| { + if pattern.contains("[*]") { + // Convert pattern to regex: replace [*] with \[\d+\] + let regex_pattern = pattern + .replace("[", "\\[") + .replace("]", "\\]") + .replace("\\[*\\]", "\\[\\d+\\]"); + regex::Regex::new(&format!("^{}", regex_pattern)) + .map(|re| re.is_match(field)) + .unwrap_or(false) + } else { + field.starts_with(pattern) + } + }; + + // Check per-test-case rules first (if we have a test case) + if let Some(test_name) = test_case { + for rule in &diffs.per_test_case { + if rule.test_case == test_name + && matches_source_target(&rule.source, &rule.target, source, target) + { + if let Some(entry) = rule.fields.iter().find(|e| pattern_matches(&e.pattern)) { + return Some(entry.reason.clone()); + } + } + } + } + + // Check global rules + for rule in &diffs.global { + if matches_source_target(&rule.source, &rule.target, source, target) { + if let Some(entry) = rule.fields.iter().find(|e| pattern_matches(&e.pattern)) { + return Some(entry.reason.clone()); + } + } + } + + None +} + +/// Check if a transform error is expected for the given source→target translation. +/// +/// Returns the reason if the error is expected (limitation), None if it's unexpected (a bug).
+pub fn is_expected_error( + category: TestCategory, + source: &str, + target: &str, + test_case: Option<&str>, + error_msg: &str, +) -> Option { + let diffs = get_expected_differences(category); + + // Helper to check if error pattern matches (substring matching) + let pattern_matches = |pattern: &str| error_msg.contains(pattern); + + // Check per-test-case rules first + if let Some(test_name) = test_case { + for rule in &diffs.per_test_case { + if rule.test_case == test_name + && matches_source_target(&rule.source, &rule.target, source, target) + { + if let Some(entry) = rule.errors.iter().find(|e| pattern_matches(&e.pattern)) { + return Some(entry.reason.clone()); + } + } + } + } + + // Check global rules + for rule in &diffs.global { + if matches_source_target(&rule.source, &rule.target, source, target) { + if let Some(entry) = rule.errors.iter().find(|e| pattern_matches(&e.pattern)) { + return Some(entry.reason.clone()); + } + } + } + + None +} + +#[cfg(test)] +mod tests { + use super::*; + + // ========================================================================= + // Test case level tests + // ========================================================================= + + #[test] + fn test_test_case_exact_match() { + assert!(is_expected_test_case( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + "imageContentParam" + ) + .is_some()); + } + + #[test] + fn test_test_case_any_source_match() { + // imageContentParam is configured with source=None, so any source should match + assert!(is_expected_test_case( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + "imageContentParam" + ) + .is_some()); + assert!(is_expected_test_case( + TestCategory::Requests, + "Responses", + "Anthropic", + "imageContentParam" + ) + .is_some()); + } + + #[test] + fn test_test_case_specific_source_match() { + // codeInterpreterToolParam is configured with source=Responses + assert!(is_expected_test_case( + TestCategory::Requests, + "Responses", + "Anthropic", + "codeInterpreterToolParam" + ) + .is_some()); + // Should NOT match with ChatCompletions source + assert!(is_expected_test_case( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + "codeInterpreterToolParam" + ) + .is_none()); + } + + #[test] + fn test_test_case_no_match() { + // Unknown test case should not match + assert!(is_expected_test_case( + TestCategory::Requests, + "Responses", + "Anthropic", + "unknownTestCase" + ) + .is_none()); + // Known test case but wrong target + assert!(is_expected_test_case( + TestCategory::Requests, + "ChatCompletions", + "ChatCompletions", + "imageContentParam" + ) + .is_none()); + } + + // ========================================================================= + // Field level tests + // ========================================================================= + + #[test] + fn test_field_exact_match() { + assert!(is_expected_field( + TestCategory::Requests, + "Anthropic", + "Responses", + None, + "params.reasoning.budget_tokens" + ) + .is_some()); + } + + #[test] + fn test_field_any_source_match() { + // Use params.metadata which legitimately differs (not validated) + assert!(is_expected_field( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + None, + "params.metadata" + ) + .is_some()); + assert!(is_expected_field( + TestCategory::Requests, + "Responses", + "Anthropic", + None, + "params.metadata" + ) + .is_some()); + } + + #[test] + fn test_field_prefix_match() { + assert!(is_expected_field( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + 
None, + "params.response_format.json_schema.schema" + ) + .is_some()); + } + + #[test] + fn test_field_no_match() { + assert!(is_expected_field( + TestCategory::Requests, + "ChatCompletions", + "Responses", + None, + "messages[0].content" + ) + .is_none()); + } + + #[test] + fn test_error_match() { + assert!(is_expected_error( + TestCategory::Requests, + "Anthropic", + "ChatCompletions", + None, + "Tool 'bash' of type 'bash_20250124' is not supported by OpenAI Chat Completions" + ) + .is_some()); + } + + #[test] + fn test_error_missing_is_failure() { + // Errors with "missing" should always be failures, not limitations + assert!(is_expected_error( + TestCategory::Requests, + "Anthropic", + "ChatCompletions", + None, + "missing model" + ) + .is_none()); + } + + #[test] + fn test_error_no_match() { + assert!(is_expected_error( + TestCategory::Requests, + "Anthropic", + "ChatCompletions", + None, + "some random error" + ) + .is_none()); + } + + // ========================================================================= + // Category isolation tests + // ========================================================================= + + #[test] + fn test_category_isolation() { + // Requests category should find entries in requests file + // Use params.metadata which legitimately differs (not validated) + assert!(is_expected_field( + TestCategory::Requests, + "ChatCompletions", + "Anthropic", + None, + "params.metadata" + ) + .is_some()); + + // Responses and Streaming categories have empty files, should not find anything + assert!(is_expected_field( + TestCategory::Responses, + "ChatCompletions", + "Anthropic", + None, + "params.metadata" + ) + .is_none()); + assert!(is_expected_field( + TestCategory::Streaming, + "ChatCompletions", + "Anthropic", + None, + "params.metadata" + ) + .is_none()); + } +} diff --git a/crates/coverage-report/src/lib.rs b/crates/coverage-report/src/lib.rs new file mode 100644 index 00000000..e9c757a6 --- /dev/null +++ b/crates/coverage-report/src/lib.rs @@ -0,0 +1,29 @@ +/*! +Cross-provider transformation coverage testing library. + +This library provides the core functionality for running cross-provider +transformation tests and generating coverage reports. + +## Usage + +```rust,ignore +use coverage_report::{run_all_tests, types::TestFilter}; +use lingua::processing::adapters::adapters; + +let adapters = adapters(); +let filter = TestFilter::default(); +let (requests, responses, streaming) = run_all_tests(adapters, &filter); +``` +*/ + +pub mod compact; +pub mod discovery; +pub mod expected; +mod normalizers; +pub mod report; +pub mod runner; +pub mod types; + +// Re-export commonly used items +pub use runner::run_all_tests; +pub use types::{PairResult, TestFilter, ValidationLevel}; diff --git a/crates/coverage-report/src/main.rs b/crates/coverage-report/src/main.rs index 2f5f0da6..9664d7dc 100644 --- a/crates/coverage-report/src/main.rs +++ b/crates/coverage-report/src/main.rs @@ -10,33 +10,224 @@ Validates: 3. 
Key semantic fields are preserved (messages, model, tools, usage) Usage: - cargo run --bin generate-coverage-report + cargo run --bin coverage-report + cargo run --bin coverage-report -- --coverage requests,responses + cargo run --bin coverage-report -- --test-cases seedParam,toolCallRequest + cargo run --bin coverage-report -- --providers responses,anthropic + cargo run --bin coverage-report -- --source responses --target anthropic */ -mod discovery; -mod report; -mod runner; -mod types; +use std::str::FromStr; +use coverage_report::report::generate_report; +use coverage_report::runner::run_all_tests; +use coverage_report::types::{parse_provider, CoverageSelection, OutputFormat, TestFilter}; use lingua::processing::adapters::adapters; -use report::generate_report; -use runner::{run_all_tests, run_roundtrip_tests}; + +struct CliArgs { + selection: CoverageSelection, + filter: TestFilter, + format: OutputFormat, +} + +fn parse_cli_args() -> Result { + let mut selection_arg: Option = None; + let mut test_cases_arg: Option = None; + let mut providers_arg: Option = None; + let mut source_arg: Option = None; + let mut target_arg: Option = None; + let mut format_arg: Option = None; + + let mut args = std::env::args().skip(1); + + while let Some(arg) = args.next() { + match arg.as_str() { + "--coverage" => { + selection_arg = args.next(); + if selection_arg.is_none() { + return Err("Missing value for --coverage".to_string()); + } + } + "--test-cases" | "-t" => { + test_cases_arg = args.next(); + if test_cases_arg.is_none() { + return Err("Missing value for --test-cases".to_string()); + } + } + "--providers" | "-p" => { + providers_arg = args.next(); + if providers_arg.is_none() { + return Err("Missing value for --providers".to_string()); + } + } + "--source" => { + source_arg = args.next(); + if source_arg.is_none() { + return Err("Missing value for --source".to_string()); + } + } + "--target" => { + target_arg = args.next(); + if target_arg.is_none() { + return Err("Missing value for --target".to_string()); + } + } + "--format" | "-f" => { + format_arg = args.next(); + if format_arg.is_none() { + return Err("Missing value for --format".to_string()); + } + } + _ if arg.starts_with("--coverage=") => { + selection_arg = Some(arg.strip_prefix("--coverage=").unwrap().to_string()); + } + _ if arg.starts_with("--test-cases=") || arg.starts_with("-t=") => { + let prefix = if arg.starts_with("--test-cases=") { + "--test-cases=" + } else { + "-t=" + }; + test_cases_arg = Some(arg.strip_prefix(prefix).unwrap().to_string()); + } + _ if arg.starts_with("--providers=") || arg.starts_with("-p=") => { + let prefix = if arg.starts_with("--providers=") { + "--providers=" + } else { + "-p=" + }; + providers_arg = Some(arg.strip_prefix(prefix).unwrap().to_string()); + } + _ if arg.starts_with("--source=") => { + source_arg = Some(arg.strip_prefix("--source=").unwrap().to_string()); + } + _ if arg.starts_with("--target=") => { + target_arg = Some(arg.strip_prefix("--target=").unwrap().to_string()); + } + _ if arg.starts_with("--format=") || arg.starts_with("-f=") => { + let prefix = if arg.starts_with("--format=") { + "--format=" + } else { + "-f=" + }; + format_arg = Some(arg.strip_prefix(prefix).unwrap().to_string()); + } + _ => { + return Err(format!("Unknown argument: {}", arg)); + } + } + } + + // Parse coverage selection + let selection = match selection_arg { + Some(value) => CoverageSelection::from_list(&value)?, + None => CoverageSelection::all(), + }; + + // Parse output format + let format = match 
format_arg { + Some(value) => OutputFormat::from_str(&value)?, + None => OutputFormat::default(), + }; + + // Parse test filter + let mut filter = TestFilter::default(); + + // Parse test case patterns + if let Some(value) = test_cases_arg { + filter.test_case_patterns = value + .split(',') + .map(|s| s.trim().to_string()) + .filter(|s| !s.is_empty()) + .collect(); + } + + // Parse providers filter (both source AND target) + if let Some(value) = providers_arg { + let providers: Result, _> = + value.split(',').map(|s| parse_provider(s.trim())).collect(); + filter.providers = Some(providers?); + } + + // Parse explicit source filter + if let Some(value) = source_arg { + let sources: Result, _> = + value.split(',').map(|s| parse_provider(s.trim())).collect(); + filter.sources = Some(sources?); + } + + // Parse explicit target filter + if let Some(value) = target_arg { + let targets: Result, _> = + value.split(',').map(|s| parse_provider(s.trim())).collect(); + filter.targets = Some(targets?); + } + + Ok(CliArgs { + selection, + filter, + format, + }) +} + +fn print_usage() { + eprintln!("Usage: coverage-report [OPTIONS]"); + eprintln!(); + eprintln!("Options:"); + eprintln!(" --coverage Coverage types: requests,responses,streaming,all"); + eprintln!( + " -t, --test-cases Test case patterns (glob: seedParam, reasoning*, *Param)" + ); + eprintln!( + " -p, --providers Filter provider pairs (both source AND target must match)" + ); + eprintln!(" --source Filter source providers"); + eprintln!(" --target Filter target providers"); + eprintln!(" -f, --format Output format: markdown (default), compact"); + eprintln!(); + eprintln!("Provider names: responses, chat-completions, anthropic, google, bedrock"); + eprintln!(); + eprintln!("Examples:"); + eprintln!(" coverage-report # Run all tests"); + eprintln!( + " coverage-report --coverage requests # Only request transformations" + ); + eprintln!(" coverage-report -t seedParam # Only seedParam test case"); + eprintln!(" coverage-report -t \"reasoning*\" # All reasoning test cases"); + eprintln!(" coverage-report -p chat-completions # Roundtrip tests for ChatCompletions"); + eprintln!(" coverage-report -p responses,anthropic # Only Responses↔Anthropic"); + eprintln!( + " coverage-report --source responses --target anthropic # Only Responses→Anthropic" + ); + eprintln!(" coverage-report -f compact # Token-optimized output"); +} fn main() { - let adapters = adapters(); + let CliArgs { + selection, + filter, + format, + } = match parse_cli_args() { + Ok(args) => args, + Err(error) => { + eprintln!("Error: {}", error); + eprintln!(); + print_usage(); + std::process::exit(2); + } + }; - // Cross-provider transformation tests - let (request_results, response_results, streaming_results) = run_all_tests(adapters); + let adapters = adapters(); - // Roundtrip transform tests (Provider → Universal → Provider) - let roundtrip_results = run_roundtrip_tests(adapters); + // Run all transformation tests (including roundtrip when source == target) + let (request_results, response_results, streaming_results) = run_all_tests(adapters, &filter); let report = generate_report( &request_results, &response_results, &streaming_results, - &roundtrip_results, adapters, + selection, + format, ); println!("{}", report); } diff --git a/crates/coverage-report/src/normalizers.rs b/crates/coverage-report/src/normalizers.rs new file mode 100644 index 00000000..b53771c3 --- /dev/null +++ b/crates/coverage-report/src/normalizers.rs @@ -0,0 +1,95 @@ +/*! 
+Semantic-equivalence normalizers for coverage-report diffs. + +These rules apply only to Universal types and keep scope explicit and type-safe. +*/ + +use lingua::serde_json::Value; +use lingua::universal::{ + message::{ + AssistantContent, AssistantContentPart, Message, TextContentPart, UserContent, + UserContentPart, + }, + UniversalRequest, UniversalResponse, UniversalStreamChunk, +}; + +/// Normalize a UniversalRequest for semantic comparison. +/// +/// Rule: message content strings are equivalent to a single text-part array. +pub fn normalize_request_for_comparison(req: &UniversalRequest) -> UniversalRequest { + let mut normalized = req.clone(); + for message in &mut normalized.messages { + normalize_message_content(message); + } + normalized +} + +/// Normalize a UniversalResponse for semantic comparison. +/// +/// Rule: message content strings are equivalent to a single text-part array. +pub fn normalize_response_for_comparison(resp: &UniversalResponse) -> UniversalResponse { + let mut normalized = resp.clone(); + for message in &mut normalized.messages { + normalize_message_content(message); + } + normalized +} + +/// Normalize a UniversalStreamChunk for semantic comparison. +/// +/// Rule: stream deltas with content strings are equivalent to a single text-part array. +pub fn normalize_stream_chunk_for_comparison(chunk: &UniversalStreamChunk) -> UniversalStreamChunk { + let mut normalized = chunk.clone(); + for choice in &mut normalized.choices { + if let Some(Value::Object(map)) = choice.delta.as_mut() { + if let Some(Value::String(text)) = map.get("content").cloned() { + map.insert("content".to_string(), text_part_value(text)); + } + } + } + normalized +} + +fn normalize_message_content(message: &mut Message) { + match message { + Message::System { content } | Message::User { content } => { + normalize_user_content(content); + } + Message::Assistant { content, .. } => { + normalize_assistant_content(content); + } + Message::Tool { .. 
} => {} + } +} + +fn normalize_user_content(content: &mut UserContent) { + if let UserContent::String(text) = content { + let text = std::mem::take(text); + *content = UserContent::Array(vec![UserContentPart::Text(text_part(text))]); + } +} + +fn normalize_assistant_content(content: &mut AssistantContent) { + if let AssistantContent::String(text) = content { + let text = std::mem::take(text); + *content = AssistantContent::Array(vec![AssistantContentPart::Text(text_part(text))]); + } +} + +fn text_part(text: String) -> TextContentPart { + TextContentPart { + text, + provider_options: None, + } +} + +fn text_part_value(text: String) -> Value { + Value::Array(vec![Value::Object( + [ + ("type".to_string(), Value::String("text".to_string())), + ("text".to_string(), Value::String(text)), + ] + .into_iter() + .collect(), + )]) +} diff --git a/crates/coverage-report/src/report.rs b/crates/coverage-report/src/report.rs index 05631724..cad77504 100644 --- a/crates/coverage-report/src/report.rs +++ b/crates/coverage-report/src/report.rs @@ -6,11 +6,16 @@ use std::collections::HashMap; use lingua::processing::adapters::ProviderAdapter; -use crate::runner::RoundtripResults; -use crate::types::{IssueEntry, PairResult, RoundtripResult, TableResult, TableStats}; +use crate::compact; +use crate::types::{ + CoverageSelection, FailureWithDiff, OutputFormat, PairResult, RoundtripDiff, TableOutput, + TableStats, +}; pub fn format_cell(pair_result: &PairResult) -> String { - let total = pair_result.passed + pair_result.failed; + // Working = passed + limitations (both represent successful translations) + let working = pair_result.passed + pair_result.limitations; + let total = working + pair_result.failed; if total == 0 { return "-".to_string(); } @@ -20,25 +25,55 @@ pub fn format_cell(pair_result: &PairResult) -> String { } else { "❌" }; - format!("{} {}/{}", emoji, pair_result.passed, total) + format!("{} {}/{}", emoji, working, total) } -/// Generate a coverage table with statistics and issue details. +/// Truncate a string to a maximum number of characters, adding "..." if truncated. +/// Uses character count, not byte count, to avoid UTF-8 panics on multi-byte characters. +fn truncate_display(s: &str, max_chars: usize) -> String { + let char_count = s.chars().count(); + if char_count > max_chars { + let truncated: String = s.chars().take(max_chars.saturating_sub(3)).collect(); + format!("{}...", truncated) + } else { + s.to_string() + } +} + +/// Render a simple link to the expected differences JSON file. +fn render_limitations_link(count: usize, transformation_type: &str) -> String { + if count == 0 { + return String::new(); + } + + // Map transformation type to JSON filename + let json_file = match transformation_type { + "Request" => "requests_expected_differences.json", + "Response" => "responses_expected_differences.json", + "Streaming" | "Streaming Response" => "streaming_expected_differences.json", + _ => "expected_differences.json", + }; + + format!( + "\n⚠️ {} tests have expected differences — [View {}](src/{})\n", + count, json_file, json_file + ) +} + +/// Generate a coverage table for a specific transformation type. 
pub fn generate_table( results: &HashMap<(usize, usize), PairResult>, adapters: &[Box], title: &str, -) -> TableResult { +) -> TableOutput { let mut table = String::new(); let mut stats = TableStats { passed: 0, failed: 0, limitations: 0, - missing_fixtures: 0, }; - let mut all_failures: Vec = Vec::new(); - let mut all_limitations: Vec = Vec::new(); - let mut all_missing_fixtures: Vec = Vec::new(); + let mut all_failures: Vec = Vec::new(); + let mut all_limitations: Vec<(String, String, String, Option)> = Vec::new(); table.push_str(&format!("### {}\n\n", title)); table.push_str("| Source ↓ / Target → |"); @@ -54,314 +89,303 @@ pub fn generate_table( for (source_idx, source) in adapters.iter().enumerate() { table.push_str(&format!("| {} |", source.display_name())); for (target_idx, target) in adapters.iter().enumerate() { - if source_idx == target_idx { - table.push_str(" - |"); - } else { - let pair_result = results.get(&(source_idx, target_idx)).unwrap(); + if let Some(pair_result) = results.get(&(source_idx, target_idx)) { table.push_str(&format!(" {} |", format_cell(pair_result))); stats.passed += pair_result.passed; stats.failed += pair_result.failed; stats.limitations += pair_result.limitations; - stats.missing_fixtures += pair_result.missing_fixtures; - for (test_case, error) in &pair_result.failures { + for (test_case, error, diff) in &pair_result.failures { all_failures.push(( format!("{} → {}", source.display_name(), target.display_name()), test_case.clone(), error.clone(), + diff.clone(), )); } - for (test_case, error) in &pair_result.limitation_details { + for (test_case, error, limitation_diff) in &pair_result.limitation_details { all_limitations.push(( format!("{} → {}", source.display_name(), target.display_name()), test_case.clone(), error.clone(), + limitation_diff.clone(), )); } - - for (test_case, error) in &pair_result.missing_fixture_details { - all_missing_fixtures.push(( - format!("{} → {}", source.display_name(), target.display_name()), - test_case.clone(), - error.clone(), - )); - } + } else { + // Pair was filtered out + table.push_str(" - |"); } } table.push('\n'); } - TableResult { - markdown: table, + TableOutput { + table_markdown: table, stats, failures: all_failures, limitations: all_limitations, - missing_fixtures: all_missing_fixtures, } } -// ============================================================================ -// Roundtrip report section -// ============================================================================ - -fn format_roundtrip_cell(passed: usize, failed: usize) -> String { - let total = passed + failed; - if total == 0 { - return "-".to_string(); - } - let emoji = if failed == 0 { "✅" } else { "❌" }; - format!("{} {}/{}", emoji, passed, total) -} - -fn format_roundtrip_diff(result: &RoundtripResult) -> String { - let mut output = String::new(); - - if let Some(error) = &result.error { - output.push_str(&format!("{}\n", error)); - } - - if let Some(diff) = &result.diff { - if !diff.lost_fields.is_empty() { - output.push_str(" Lost: "); - output.push_str(&diff.lost_fields.join(", ")); - output.push('\n'); - } - if !diff.added_fields.is_empty() { - output.push_str(" Added: "); - output.push_str(&diff.added_fields.join(", ")); - output.push('\n'); - } - if !diff.changed_fields.is_empty() { - output.push_str(" Changed:\n"); - for (path, original, roundtripped) in &diff.changed_fields { - // Truncate long values - let orig_display = if original.len() > 50 { - format!("{}...", &original[..47]) - } else { - original.clone() - }; - let 
round_display = if roundtripped.len() > 50 { - format!("{}...", &roundtripped[..47]) - } else { - roundtripped.clone() - }; - output.push_str(&format!( - " - `{}`: {} → {}\n", - path, orig_display, round_display - )); +fn format_diff(diff: &Option) -> String { + match diff { + Some(d) if !d.is_empty() => { + let mut output = String::new(); + if !d.lost_fields.is_empty() { + output.push_str("\n Lost: "); + output.push_str(&d.lost_fields.join(", ")); + } + if !d.added_fields.is_empty() { + output.push_str("\n Added: "); + output.push_str(&d.added_fields.join(", ")); + } + if !d.changed_fields.is_empty() { + output.push_str("\n Changed:"); + for (path, original, roundtripped) in &d.changed_fields { + let orig_display = truncate_display(original, 50); + let round_display = truncate_display(roundtripped, 50); + output.push_str(&format!( + "\n - `{}`: {} → {}", + path, orig_display, round_display + )); + } } + output } + _ => String::new(), } +} - output +pub fn generate_report( + request_results: &HashMap<(usize, usize), PairResult>, + response_results: &HashMap<(usize, usize), PairResult>, + streaming_results: &HashMap<(usize, usize), PairResult>, + adapters: &[Box], + selection: CoverageSelection, + format: OutputFormat, +) -> String { + match format { + OutputFormat::Markdown => generate_markdown_report( + request_results, + response_results, + streaming_results, + adapters, + selection, + ), + OutputFormat::Compact => generate_compact_report( + request_results, + response_results, + streaming_results, + adapters, + selection, + ), + } } -/// Generate the roundtrip transform coverage section of the report. -pub fn generate_roundtrip_section( - roundtrip_results: &RoundtripResults, +fn generate_compact_report( + request_results: &HashMap<(usize, usize), PairResult>, + response_results: &HashMap<(usize, usize), PairResult>, + streaming_results: &HashMap<(usize, usize), PairResult>, adapters: &[Box], + selection: CoverageSelection, ) -> String { let mut report = String::new(); - report.push_str("## Roundtrip Transform Coverage\n\n"); - report.push_str("Tests Provider → Universal → Provider fidelity.\n\n"); - - // Summary table - report.push_str("### Summary\n\n"); - report.push_str("| Provider | Requests | Responses |\n"); - report.push_str("|----------|----------|----------|\n"); - - let mut total_req_passed = 0; - let mut total_req_failed = 0; - let mut total_resp_passed = 0; - let mut total_resp_failed = 0; - - for (adapter_idx, adapter) in adapters.iter().enumerate() { - if let Some(result) = roundtrip_results.get(&adapter_idx) { - let req_cell = format_roundtrip_cell(result.request_passed, result.request_failed); - let resp_cell = format_roundtrip_cell(result.response_passed, result.response_failed); - report.push_str(&format!( - "| {} | {} | {} |\n", - adapter.display_name(), - req_cell, - resp_cell - )); - - total_req_passed += result.request_passed; - total_req_failed += result.request_failed; - total_resp_passed += result.response_passed; - total_resp_failed += result.response_failed; - } - } + // Collect stats + let req_stats = compact::collect_stats(request_results); + let resp_stats = compact::collect_stats(response_results); + let stream_stats = compact::collect_stats(streaming_results); - let total_passed = total_req_passed + total_resp_passed; - let total_failed = total_req_failed + total_resp_failed; - let total = total_passed + total_failed; - let pass_percentage = if total > 0 { - (total_passed as f64 / total as f64) * 100.0 - } else { - 0.0 - }; - - report.push_str(&format!( 
- "\n**{}/{} ({:.1}%)** - {} failed\n", - total_passed, total, pass_percentage, total_failed + // Header with stats + report.push_str(&compact::generate_compact_header( + &req_stats, + &resp_stats, + &stream_stats, )); - // Issues by provider - let has_failures = roundtrip_results.values().any(|r| r.total_failed() > 0); - - if has_failures { - report.push_str("\n### Issues by Provider\n\n"); - - // Sort providers by failure count - let mut providers_with_failures: Vec<_> = adapters - .iter() - .enumerate() - .filter_map(|(idx, adapter)| { - roundtrip_results - .get(&idx) - .filter(|r| r.total_failed() > 0) - .map(|r| (adapter, r)) - }) - .collect(); - providers_with_failures.sort_by(|a, b| b.1.total_failed().cmp(&a.1.total_failed())); - - for (adapter, result) in providers_with_failures { - let total_issues = result.total_failed(); - report.push_str("
\n"); - report.push_str(&format!( - "❌ {} ({} issues)\n\n", - adapter.display_name(), - total_issues - )); - - // Request roundtrip issues - if !result.request_failures.is_empty() { - report.push_str(&format!( - "**Request roundtrip issues ({}):**\n\n", - result.request_failures.len() - )); - for (test_case, roundtrip_result) in &result.request_failures { - report.push_str(&format!("- `{}`\n", test_case)); - let diff_output = format_roundtrip_diff(roundtrip_result); - if !diff_output.is_empty() { - report.push_str(&diff_output); - } - } - report.push('\n'); - } + // Collect all failures + let mut all_failures = Vec::new(); + if selection.requests { + all_failures.extend(compact::collect_failures(request_results, adapters)); + } + if selection.responses { + all_failures.extend(compact::collect_failures(response_results, adapters)); + } + if selection.streaming { + all_failures.extend(compact::collect_failures(streaming_results, adapters)); + } - // Response roundtrip issues - if !result.response_failures.is_empty() { - report.push_str(&format!( - "**Response roundtrip issues ({}):**\n\n", - result.response_failures.len() - )); - for (test_case, roundtrip_result) in &result.response_failures { - report.push_str(&format!("- `{}`\n", test_case)); - let diff_output = format_roundtrip_diff(roundtrip_result); - if !diff_output.is_empty() { - report.push_str(&diff_output); - } - } - report.push('\n'); - } + // Deduplicated failures section + report.push_str(&compact::generate_compact_failures(&all_failures)); - report.push_str("
\n\n"); - } + // Collect all limitations + let mut all_limitations = Vec::new(); + if selection.requests { + all_limitations.extend(compact::collect_limitations(request_results, adapters)); + } + if selection.responses { + all_limitations.extend(compact::collect_limitations(response_results, adapters)); + } + if selection.streaming { + all_limitations.extend(compact::collect_limitations(streaming_results, adapters)); } + // Limitations section + report.push_str(&compact::generate_compact_limitations(&all_limitations)); + report } -pub fn generate_report( +fn generate_markdown_report( request_results: &HashMap<(usize, usize), PairResult>, response_results: &HashMap<(usize, usize), PairResult>, streaming_results: &HashMap<(usize, usize), PairResult>, - roundtrip_results: &RoundtripResults, adapters: &[Box], + selection: CoverageSelection, ) -> String { let mut report = String::new(); - report.push_str("## Cross-Provider Transformation Coverage\n\n"); + report.push_str("## Transformation Coverage\n\n"); - let req = generate_table(request_results, adapters, "Request Transformations"); - report.push_str(&req.markdown); + // Add explanatory paragraph about test semantics + report.push_str("Tests format interoperability between providers. "); + report.push_str( + "Diagonal cells (e.g., ChatCompletions→ChatCompletions) test roundtrip fidelity. ", + ); + report.push_str("Off-diagonal cells test cross-provider translation.\n\n"); - report.push('\n'); - let resp = generate_table(response_results, adapters, "Response Transformations"); - report.push_str(&resp.markdown); + let mut req_stats = TableStats { + passed: 0, + failed: 0, + limitations: 0, + }; + let mut resp_stats = TableStats { + passed: 0, + failed: 0, + limitations: 0, + }; + let mut stream_stats = TableStats { + passed: 0, + failed: 0, + limitations: 0, + }; - report.push('\n'); - let stream = generate_table( - streaming_results, - adapters, - "Streaming Response Transformations", - ); - report.push_str(&stream.markdown); + let mut req_failures: Vec = Vec::new(); + let mut resp_failures: Vec = Vec::new(); + let mut stream_failures: Vec = Vec::new(); + + let mut has_table = false; + if selection.requests { + let output = generate_table(request_results, adapters, "Request Transformations"); + report.push_str(&output.table_markdown); + report.push_str(&render_limitations_link( + output.stats.limitations, + "Request", + )); + req_stats = output.stats; + req_failures = output.failures; + has_table = true; + } - let total_passed = req.stats.passed + resp.stats.passed + stream.stats.passed; - let total_failed = req.stats.failed + resp.stats.failed + stream.stats.failed; + if selection.responses { + if has_table { + report.push('\n'); + } + let output = generate_table(response_results, adapters, "Response Transformations"); + report.push_str(&output.table_markdown); + report.push_str(&render_limitations_link( + output.stats.limitations, + "Response", + )); + resp_stats = output.stats; + resp_failures = output.failures; + has_table = true; + } + + if selection.streaming { + if has_table { + report.push('\n'); + } + let output = generate_table( + streaming_results, + adapters, + "Streaming Response Transformations", + ); + report.push_str(&output.table_markdown); + report.push_str(&render_limitations_link( + output.stats.limitations, + "Streaming", + )); + stream_stats = output.stats; + stream_failures = output.failures; + } + + let total_passed = req_stats.passed + resp_stats.passed + stream_stats.passed; + let total_failed = req_stats.failed + 
resp_stats.failed + stream_stats.failed; let total_limitations = - req.stats.limitations + resp.stats.limitations + stream.stats.limitations; - let total_missing = - req.stats.missing_fixtures + resp.stats.missing_fixtures + stream.stats.missing_fixtures; - let total = total_passed + total_failed; + req_stats.limitations + resp_stats.limitations + stream_stats.limitations; - let pass_percentage = if total > 0 { - (total_passed as f64 / total as f64) * 100.0 + // "Working" = passed + limitations (both represent successful translations) + let total_working = total_passed + total_limitations; + let working_total = total_working + total_failed; + let working_percentage = if working_total > 0 { + (total_working as f64 / working_total as f64) * 100.0 } else { 0.0 }; report.push_str("\n### Summary\n\n"); report.push_str(&format!( - "**{}/{} ({:.1}%)** - {} failed, {} limitations, {} missing fixtures\n", - total_passed, total, pass_percentage, total_failed, total_limitations, total_missing + "**{}/{} ({:.1}%) working** [{} full + {} limited] - {} failed\n", + total_working, + working_total, + working_percentage, + total_passed, + total_limitations, + total_failed )); - let req_total = req.stats.passed + req.stats.failed; - let resp_total = resp.stats.passed + resp.stats.failed; - let stream_total = stream.stats.passed + stream.stats.failed; - - report.push_str(&format!( - "\n**Requests:** {}/{} passed, {} failed, {} limitations, {} missing\n", - req.stats.passed, - req_total, - req.stats.failed, - req.stats.limitations, - req.stats.missing_fixtures - )); - report.push_str(&format!( - "**Responses:** {}/{} passed, {} failed, {} limitations, {} missing\n", - resp.stats.passed, - resp_total, - resp.stats.failed, - resp.stats.limitations, - resp.stats.missing_fixtures - )); - report.push_str(&format!( - "**Streaming:** {}/{} passed, {} failed, {} limitations, {} missing\n", - stream.stats.passed, - stream_total, - stream.stats.failed, - stream.stats.limitations, - stream.stats.missing_fixtures - )); + if selection.requests { + let req_working = req_stats.passed + req_stats.limitations; + let req_total = req_working + req_stats.failed; + report.push_str(&format!( + "\n**Requests:** {}/{} working [{} full + {} limited], {} failed\n", + req_working, req_total, req_stats.passed, req_stats.limitations, req_stats.failed + )); + } + if selection.responses { + let resp_working = resp_stats.passed + resp_stats.limitations; + let resp_total = resp_working + resp_stats.failed; + report.push_str(&format!( + "**Responses:** {}/{} working [{} full + {} limited], {} failed\n", + resp_working, resp_total, resp_stats.passed, resp_stats.limitations, resp_stats.failed + )); + } + if selection.streaming { + let stream_working = stream_stats.passed + stream_stats.limitations; + let stream_total = stream_working + stream_stats.failed; + report.push_str(&format!( + "**Streaming:** {}/{} working [{} full + {} limited], {} failed\n", + stream_working, + stream_total, + stream_stats.passed, + stream_stats.limitations, + stream_stats.failed + )); + } // Organize issues by source provider → request/response/streaming → target - if !req.failures.is_empty() || !resp.failures.is_empty() || !stream.failures.is_empty() { + if !req_failures.is_empty() || !resp_failures.is_empty() || !stream_failures.is_empty() { report.push_str("\n### Issues by Source\n\n"); // Group failures by source provider, keeping request/response/streaming separate - let mut req_by_source: HashMap> = HashMap::new(); - let mut resp_by_source: HashMap> = 
HashMap::new(); - let mut stream_by_source: HashMap> = HashMap::new(); + let mut req_by_source: HashMap> = HashMap::new(); + let mut resp_by_source: HashMap> = HashMap::new(); + let mut stream_by_source: HashMap> = HashMap::new(); - for (direction, test_case, error) in req.failures { + for (direction, test_case, error, diff) in req_failures { let source = direction .split(" → ") .next() @@ -370,10 +394,10 @@ pub fn generate_report( req_by_source .entry(source) .or_default() - .push((direction, test_case, error)); + .push((direction, test_case, error, diff)); } - for (direction, test_case, error) in resp.failures { + for (direction, test_case, error, diff) in resp_failures { let source = direction .split(" → ") .next() @@ -382,10 +406,10 @@ pub fn generate_report( resp_by_source .entry(source) .or_default() - .push((direction, test_case, error)); + .push((direction, test_case, error, diff)); } - for (direction, test_case, error) in stream.failures { + for (direction, test_case, error, diff) in stream_failures { let source = direction .split(" → ") .next() @@ -394,7 +418,7 @@ pub fn generate_report( stream_by_source .entry(source) .or_default() - .push((direction, test_case, error)); + .push((direction, test_case, error, diff)); } // Get all unique sources and sort by total failure count @@ -428,17 +452,19 @@ pub fn generate_report( )); // Group by target - let mut by_target: HashMap> = HashMap::new(); - for (direction, test_case, error) in req_failures { + let mut by_target: HashMap)>> = + HashMap::new(); + for (direction, test_case, error, diff) in req_failures { let target = direction .split(" → ") .nth(1) .unwrap_or("Unknown") .to_string(); - by_target - .entry(target) - .or_default() - .push((test_case.clone(), error.clone())); + by_target.entry(target).or_default().push(( + test_case.clone(), + error.clone(), + diff.clone(), + )); } let mut targets: Vec<_> = by_target.into_iter().collect(); @@ -452,8 +478,13 @@ pub fn generate_report( target_failures.len() )); - for (test_case, error) in target_failures { - report.push_str(&format!(" - `{}` - {}\n", test_case, error)); + for (test_case, error, diff) in target_failures { + report.push_str(&format!( + " - `{}` - {}{}\n", + test_case, + error, + format_diff(&diff) + )); } report.push_str("\n\n\n"); @@ -471,17 +502,19 @@ pub fn generate_report( )); // Group by target - let mut by_target: HashMap> = HashMap::new(); - for (direction, test_case, error) in resp_failures { + let mut by_target: HashMap)>> = + HashMap::new(); + for (direction, test_case, error, diff) in resp_failures { let target = direction .split(" → ") .nth(1) .unwrap_or("Unknown") .to_string(); - by_target - .entry(target) - .or_default() - .push((test_case.clone(), error.clone())); + by_target.entry(target).or_default().push(( + test_case.clone(), + error.clone(), + diff.clone(), + )); } let mut targets: Vec<_> = by_target.into_iter().collect(); @@ -495,8 +528,13 @@ pub fn generate_report( target_failures.len() )); - for (test_case, error) in target_failures { - report.push_str(&format!(" - `{}` - {}\n", test_case, error)); + for (test_case, error, diff) in target_failures { + report.push_str(&format!( + " - `{}` - {}{}\n", + test_case, + error, + format_diff(&diff) + )); } report.push_str("\n\n\n"); @@ -514,17 +552,19 @@ pub fn generate_report( )); // Group by target - let mut by_target: HashMap> = HashMap::new(); - for (direction, test_case, error) in stream_failures { + let mut by_target: HashMap)>> = + HashMap::new(); + for (direction, test_case, error, diff) in 
stream_failures { let target = direction .split(" → ") .nth(1) .unwrap_or("Unknown") .to_string(); - by_target - .entry(target) - .or_default() - .push((test_case.clone(), error.clone())); + by_target.entry(target).or_default().push(( + test_case.clone(), + error.clone(), + diff.clone(), + )); } let mut targets: Vec<_> = by_target.into_iter().collect(); @@ -538,8 +578,13 @@ pub fn generate_report( target_failures.len() )); - for (test_case, error) in target_failures { - report.push_str(&format!(" - `{}` - {}\n", test_case, error)); + for (test_case, error, diff) in target_failures { + report.push_str(&format!( + " - `{}` - {}{}\n", + test_case, + error, + format_diff(&diff) + )); } report.push_str("\n\n\n"); @@ -552,119 +597,5 @@ pub fn generate_report( } } - // Add provider limitations section - let all_limitations: Vec<_> = req - .limitations - .into_iter() - .chain(resp.limitations) - .chain(stream.limitations) - .collect(); - - if !all_limitations.is_empty() { - report.push_str("\n### Provider Limitations\n\n"); - report.push_str("These are provider-specific features that cannot be transformed:\n\n"); - - // Group by source provider - let mut by_source: HashMap> = HashMap::new(); - for (direction, test_case, error) in all_limitations { - let source = direction - .split(" → ") - .next() - .unwrap_or(&direction) - .to_string(); - by_source - .entry(source) - .or_default() - .push((direction, test_case, error)); - } - - let mut sources: Vec<_> = by_source.into_iter().collect(); - sources.sort_by(|a, b| b.1.len().cmp(&a.1.len())); - - for (source, limitations) in sources { - report.push_str("
\n"); - report.push_str(&format!( - "⚠️ {} ({} limitations)\n\n", - source, - limitations.len() - )); - - // Group by target - let mut by_target: HashMap> = HashMap::new(); - for (direction, test_case, error) in limitations { - let target = direction - .split(" → ") - .nth(1) - .unwrap_or("Unknown") - .to_string(); - by_target - .entry(target) - .or_default() - .push((test_case, error)); - } - - let mut targets: Vec<_> = by_target.into_iter().collect(); - targets.sort_by(|a, b| b.1.len().cmp(&a.1.len())); - - for (target, target_limitations) in targets { - report.push_str(&format!("**→ {}:**\n", target)); - for (test_case, error) in target_limitations { - report.push_str(&format!(" - `{}` - {}\n", test_case, error)); - } - report.push('\n'); - } - - report.push_str("
\n\n"); - } - } - - // Add missing fixtures section (collapsed by default) - let all_missing: Vec<_> = req - .missing_fixtures - .into_iter() - .chain(resp.missing_fixtures) - .chain(stream.missing_fixtures) - .collect(); - - if !all_missing.is_empty() { - report.push_str("\n### Missing Test Fixtures\n\n"); - report.push_str("
\n"); - report.push_str(&format!( - "📁 {} missing fixtures (expand to see details)\n\n", - all_missing.len() - )); - - // Group by source provider - let mut by_source: HashMap> = HashMap::new(); - for (direction, test_case, error) in all_missing { - let source = direction - .split(" → ") - .next() - .unwrap_or(&direction) - .to_string(); - by_source - .entry(source) - .or_default() - .push((direction, test_case, error)); - } - - let mut sources: Vec<_> = by_source.into_iter().collect(); - sources.sort_by(|a, b| b.1.len().cmp(&a.1.len())); - - for (source, missing) in sources { - report.push_str(&format!("**{}** ({} missing):\n", source, missing.len())); - for (_, test_case, _) in missing { - report.push_str(&format!(" - `{}`\n", test_case)); - } - report.push('\n'); - } - - report.push_str("
\n"); - } - - // Add roundtrip section - report.push('\n'); - report.push_str(&generate_roundtrip_section(roundtrip_results, adapters)); - report } diff --git a/crates/coverage-report/src/requests_expected_differences.json b/crates/coverage-report/src/requests_expected_differences.json new file mode 100644 index 00000000..9e9d1f2f --- /dev/null +++ b/crates/coverage-report/src/requests_expected_differences.json @@ -0,0 +1,255 @@ +{ + "global": [ + { + "source": "*", + "target": "*", + "fields": [ + { "pattern": "params.service_tier", "reason": "OpenAI-specific billing tier not universal across providers" }, + { "pattern": "messages[*].id", "reason": "Message/response IDs are provider-specific (OpenAI uses response-level IDs, Anthropic uses message-level IDs, Bedrock has none)" } + ] + }, + { + "source": "*", + "target": "Anthropic", + "fields": [ + { "pattern": "params.reasoning.summary", "reason": "Anthropic doesn't support reasoning summary" }, + { "pattern": "params.response_format.format_type", "reason": "Anthropic converts json_object to json_schema" }, + { "pattern": "params.response_format.json_schema.name", "reason": "Anthropic rejects 'name' field" }, + { "pattern": "params.response_format.json_schema.strict", "reason": "Anthropic rejects 'strict' field" }, + { "pattern": "params.response_format.json_schema", "reason": "Anthropic uses different json_schema format" }, + { "pattern": "params.response_format", "reason": "Anthropic doesn't support Text format type" }, + { "pattern": "params.metadata", "reason": "Anthropic only accepts user_id in metadata" }, + { "pattern": "params.parallel_tool_calls", "reason": "Anthropic only supports disable_parallel via tool_choice" }, + { "pattern": "params.tool_choice", "reason": "Anthropic requires tool_choice to express disable_parallel_tool_use" } + ], + "errors": [ + { "pattern": "does not support logprobs", "reason": "Anthropic doesn't support logprobs parameter" }, + { "pattern": "does not support top_logprobs", "reason": "Anthropic doesn't support top_logprobs parameter" }, + { "pattern": "does not support frequency_penalty", "reason": "Anthropic doesn't support frequency_penalty parameter" }, + { "pattern": "does not support presence_penalty", "reason": "Anthropic doesn't support presence_penalty parameter" }, + { "pattern": "does not support seed", "reason": "Anthropic doesn't support seed parameter" }, + { "pattern": "does not support store", "reason": "Anthropic doesn't support store parameter" }, + { "pattern": "does not support n > 1", "reason": "Anthropic doesn't support multiple completions" } + ] + }, + { + "source": "*", + "target": "ChatCompletions", + "fields": [ + { "pattern": "params.reasoning.summary", "reason": "ChatCompletions doesn't support reasoning summary" } + ], + "errors": [ + { "pattern": "does not support top_k", "reason": "OpenAI Chat Completions doesn't support top_k parameter" }, + { "pattern": "is not supported by OpenAI Chat Completions", "reason": "Provider-specific built-in tool has no OpenAI equivalent" }, + { "pattern": "Unsupported input type: UserContentPart variant: File", "reason": "Anthropic document blocks not supported in OpenAI" } + ] + }, + { + "source": "ChatCompletions", + "target": "*", + "fields": [ + { "pattern": "messages[*].refusal", "reason": "ChatCompletions refusal field has no equivalent in other providers" }, + { "pattern": "messages[*].annotations", "reason": "ChatCompletions annotations field has no equivalent in other providers" } + ] + }, + { + "source": "*", + "target": 
"Responses", + "fields": [ + ], + "errors": [ + { "pattern": "does not support top_k", "reason": "OpenAI Responses API doesn't support top_k parameter" }, + { "pattern": "does not support stop sequences", "reason": "OpenAI Responses API doesn't support stop sequences" }, + { "pattern": "is not supported by OpenAI Responses API", "reason": "Provider-specific built-in tool has no OpenAI equivalent" }, + { "pattern": "Unsupported input type: UserContentPart variant: File", "reason": "Anthropic document blocks not supported in OpenAI" }, + { "pattern": "ToolResult { tool_name: \"web_search\"", "reason": "Anthropic web_search encrypted results cannot be transformed to OpenAI" } + ] + }, + { + "source": "ChatCompletions", + "target": "Responses", + "fields": [ + { "pattern": "params.frequency_penalty", "reason": "Responses API doesn't support frequency_penalty" }, + { "pattern": "params.presence_penalty", "reason": "Responses API doesn't support presence_penalty" }, + { "pattern": "params.seed", "reason": "Responses API doesn't support seed" }, + { "pattern": "params.logprobs", "reason": "Responses API doesn't support logprobs boolean (use top_logprobs)" } + ] + }, + { + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "params.reasoning.budget_tokens", "reason": "OpenAI uses effort levels, budget_tokens gets quantized" }, + { "pattern": "params.tools", "reason": "Anthropic built-in tools not supported in OpenAI" }, + { "pattern": "messages.length", "reason": "Responses API expands tool messages to separate function_call_output items" } + ] + }, + { + "source": "Anthropic", + "target": "ChatCompletions", + "fields": [ + { "pattern": "params.reasoning.budget_tokens", "reason": "OpenAI uses effort levels, budget_tokens gets quantized" }, + { "pattern": "params.tools", "reason": "Anthropic built-in tools not supported in OpenAI" } + ] + }, + { + "source": "*", + "target": "Bedrock", + "fields": [ + { "pattern": "params.temperature", "reason": "Bedrock requires temperature=1.0 for extended thinking" }, + { "pattern": "params.stream", "reason": "Bedrock uses endpoint-based streaming" }, + { "pattern": "params.metadata", "reason": "Bedrock doesn't support metadata" } + ] + }, + { + "source": "*", + "target": "Google", + "fields": [ + { "pattern": "params.stream", "reason": "Google uses endpoint-based streaming" }, + { "pattern": "params.metadata", "reason": "Google doesn't support metadata" } + ] + } + ], + "perTestCase": [ + { + "testCase": "imageContentParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic assistant messages don't support image content" + }, + { + "testCase": "documentContentParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic assistant messages don't support document content" + }, + { + "testCase": "multimodalRequest", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic assistant messages don't support image content" + }, + { + "testCase": "complexReasoningRequest", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "reasoningEffortLowParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "reasoningRequest", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + 
"testCase": "reasoningRequestTruncated", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "reasoningSummaryParam", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "reasoningWithOutput", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "simpleRequest", + "source": "*", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic requires temperature=1.0 for extended thinking" + }, + { + "testCase": "codeInterpreterToolParam", + "source": "Responses", + "target": "Anthropic", + "skip": true, + "reason": "OpenAI code_interpreter tool has no Anthropic equivalent" + }, + { + "testCase": "webSearchToolParam", + "source": "Responses", + "target": "Anthropic", + "skip": true, + "reason": "OpenAI web_search_preview tool has no Anthropic equivalent" + }, + { + "testCase": "multimodalRequest", + "source": "ChatCompletions", + "target": "Responses", + "skip": true, + "reason": "Image media_type normalization artifact" + }, + { + "testCase": "instructionsParam", + "source": "ChatCompletions", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic extracts system messages to separate system parameter" + }, + { + "testCase": "instructionsParam", + "source": "Responses", + "target": "Anthropic", + "skip": true, + "reason": "Anthropic extracts system messages to separate system parameter" + }, + { + "testCase": "multimodalRequest", + "source": "Responses", + "target": "ChatCompletions", + "skip": true, + "reason": "Image provider_options not preserved in cross-provider transformation" + }, + { + "testCase": "complexReasoningRequest", + "source": "Responses", + "target": "ChatCompletions", + "skip": true, + "reason": "ChatCompletions collapses reasoning summary blocks to single string" + }, + { + "testCase": "webSearchToolParam", + "source": "Anthropic", + "target": "Responses", + "skip": true, + "reason": "Anthropic web_search encrypted results cannot be transformed to OpenAI" + }, + { + "testCase": "webSearchToolAdvancedParam", + "source": "Anthropic", + "target": "Responses", + "skip": true, + "reason": "Anthropic web_search encrypted results cannot be transformed to OpenAI" + }, + { + "testCase": "documentContentParam", + "source": "Anthropic", + "target": "ChatCompletions", + "skip": true, + "reason": "Anthropic document blocks not supported in OpenAI ChatCompletions" + } + ] +} diff --git a/crates/coverage-report/src/responses_expected_differences.json b/crates/coverage-report/src/responses_expected_differences.json new file mode 100644 index 00000000..a8ac797f --- /dev/null +++ b/crates/coverage-report/src/responses_expected_differences.json @@ -0,0 +1,108 @@ +{ + "global": [ + { + "source": "*", + "target": "*", + "fields": [ + { "pattern": "messages[*].id", "reason": "Message/response IDs are provider-specific and represent different concepts across providers" }, + { "pattern": "params.service_tier", "reason": "OpenAI-specific billing tier not universal" } + ] + }, + { + "source": "Anthropic", + "target": "*", + "fields": [ + { "pattern": "usage.prompt_cache_creation_tokens", "reason": "Only Anthropic reports cache creation tokens" } + ] + }, + { + "source": "*", + "target": "Anthropic", + "fields": [ + { "pattern": "usage.completion_reasoning_tokens", "reason": "Anthropic doesn't 
expose reasoning tokens separately (included in output_tokens)" } + ] + } + ], + "perTestCase": [ + { + "testCase": "nMultipleCompletionsParam", + "source": "ChatCompletions", + "target": "Anthropic", + "fields": [ + { "pattern": "messages.length", "reason": "Anthropic doesn't support n>1 (multiple completions), only first choice is preserved" } + ] + }, + { + "testCase": "reasoningEffortLowParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic thinking blocks become separate 'reasoning' output items in Responses API" } + ] + }, + { + "testCase": "reasoningSummaryParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic thinking blocks become separate 'reasoning' output items in Responses API" } + ] + }, + { + "testCase": "codeInterpreterToolParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic thinking blocks become separate 'reasoning' output items in Responses API" } + ] + }, + { + "testCase": "parallelToolCallsDisabledParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic thinking blocks become separate 'reasoning' output items in Responses API" } + ] + }, + { + "testCase": "toolCallRequest", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic thinking blocks become separate 'reasoning' output items in Responses API" } + ] + }, + { + "testCase": "webSearchToolParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic web search content blocks become 'web_search_call' output items in Responses API" } + ] + }, + { + "testCase": "webSearchToolAdvancedParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic web search content blocks become 'web_search_call' output items in Responses API" } + ] + }, + { + "testCase": "webSearchToolParam", + "source": "Anthropic", + "target": "ChatCompletions", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic web search content blocks don't map 1:1 to ChatCompletions structure" } + ] + }, + { + "testCase": "webSearchToolAdvancedParam", + "source": "Anthropic", + "target": "ChatCompletions", + "fields": [ + { "pattern": "messages[0].content.length", "reason": "Anthropic web search content blocks don't map 1:1 to ChatCompletions structure" } + ] + } + ] +} diff --git a/crates/coverage-report/src/runner.rs b/crates/coverage-report/src/runner.rs index 72cf8902..3b29a044 100644 --- a/crates/coverage-report/src/runner.rs +++ b/crates/coverage-report/src/runner.rs @@ -11,34 +11,49 @@ use lingua::processing::transform::{ transform_request, transform_response, transform_stream_chunk, }; use lingua::serde_json::Value; +use lingua::universal::{UniversalRequest, UniversalResponse, UniversalStreamChunk}; -use crate::discovery::{discover_test_cases, load_payload}; -use crate::types::{PairResult, TransformResult, ValidationLevel}; +use crate::discovery::{discover_test_cases_filtered, load_payload}; +use crate::expected::TestCategory; +use crate::normalizers::{ + normalize_request_for_comparison, normalize_response_for_comparison, + normalize_stream_chunk_for_comparison, +}; +use 
crate::types::{PairResult, TestFilter, TransformResult, ValidationLevel}; type PairResults = HashMap<(usize, usize), PairResult>; type AllResults = (PairResults, PairResults, PairResults); -// Patterns that indicate provider limitations (real gaps, not bugs) -const LIMITATION_PATTERNS: &[&str] = &[ - "Provider limitation", - "has no OpenAI equivalent", - "has no Anthropic equivalent", - "has no Bedrock equivalent", - "has no Google equivalent", - "Unsupported", -]; - -// Patterns that indicate missing test fixtures (test coverage gaps) -const MISSING_FIXTURE_PATTERNS: &[&str] = &["Source payload not found"]; - -/// Classify an error into failure, limitation, or missing fixture. -fn classify_error(error: &str) -> ValidationLevel { - if MISSING_FIXTURE_PATTERNS.iter().any(|p| error.contains(p)) { - ValidationLevel::MissingFixture - } else if LIMITATION_PATTERNS.iter().any(|p| error.contains(p)) { - ValidationLevel::Limitation +fn universal_request_to_value(req: &UniversalRequest) -> Value { + lingua::serde_json::to_value(normalize_request_for_comparison(req)).unwrap_or(Value::Null) +} + +fn universal_response_to_value(resp: &UniversalResponse) -> Value { + lingua::serde_json::to_value(normalize_response_for_comparison(resp)).unwrap_or(Value::Null) +} + +fn universal_stream_to_value(chunk: &UniversalStreamChunk) -> Value { + lingua::serde_json::to_value(normalize_stream_chunk_for_comparison(chunk)) + .unwrap_or(Value::Null) +} + +fn diff_to_transform_result(result: RoundtripResult) -> TransformResult { + // For limitations, extract reason from expected_diffs if available + let limitation_reason = if result.level == ValidationLevel::Limitation { + result + .diff + .as_ref() + .and_then(|d| d.expected_diffs.first()) + .map(|(_, _, _, reason)| reason.clone()) } else { - ValidationLevel::Fail + None + }; + + TransformResult { + level: result.level, + error: result.error, + diff: result.diff, + limitation_reason, } } @@ -56,8 +71,10 @@ pub fn test_request_transformation( None => { let error = format!("Source payload not found: {}", filename); return TransformResult { - level: ValidationLevel::MissingFixture, + level: ValidationLevel::Skipped, error: Some(error), + diff: None, + limitation_reason: None, }; } }; @@ -69,15 +86,39 @@ pub fn test_request_transformation( _ => None, }; + let payload_value: Value = match lingua::serde_json::from_slice(&payload) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Failed to parse source payload: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + let mut expected_universal = match source_adapter.request_to_universal(payload_value) { + Ok(u) => u, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion to universal format failed: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + if model.is_some() && expected_universal.model.is_none() { + expected_universal.model = model.map(String::from); + } + + target_adapter.apply_defaults(&mut expected_universal); + let expected_universal_value = universal_request_to_value(&expected_universal); + match transform_request(payload, target_adapter.format(), model) { Ok(result) => { - if result.is_passthrough() && source_adapter.format() == target_adapter.format() { - return TransformResult { - level: ValidationLevel::Pass, - error: None, - }; - } - // Parse result bytes to Value for validation let output_bytes = result.into_bytes(); let transformed: Value = match 
lingua::serde_json::from_slice(&output_bytes) { @@ -86,28 +127,69 @@ pub fn test_request_transformation( return TransformResult { level: ValidationLevel::Fail, error: Some(format!("Failed to parse transformed output: {}", e)), + diff: None, + limitation_reason: None, } } }; // Use request_to_universal to validate - gives detailed error info match target_adapter.request_to_universal(transformed) { - Ok(_) => TransformResult { - level: ValidationLevel::Pass, - error: None, - }, + Ok(target_universal) => { + let target_universal_value = universal_request_to_value(&target_universal); + let context = CompareContext::for_cross_provider( + TestCategory::Requests, + source_adapter, + target_adapter, + test_case, + ); + let roundtrip_result = compare_values( + &expected_universal_value, + &target_universal_value, + context.as_ref(), + ); + diff_to_transform_result(roundtrip_result) + } Err(e) => TransformResult { level: ValidationLevel::Fail, - error: Some(e.to_string()), + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, }, } } Err(e) => { - let error = format!("{}", e); - let level = classify_error(&error); + let error_msg = e.to_string(); + let context = CompareContext::for_cross_provider( + TestCategory::Requests, + source_adapter, + target_adapter, + test_case, + ); + // For roundtrip tests (context=None), all errors are real failures + let reason = context.as_ref().and_then(|ctx| { + ctx.is_test_case_limitation().or_else(|| { + is_expected_error( + ctx.category, + ctx.source, + ctx.target, + Some(ctx.test_case), + &error_msg, + ) + }) + }); + + let level = if reason.is_some() { + ValidationLevel::Limitation + } else { + ValidationLevel::Fail + }; + TransformResult { level, - error: Some(error), + error: Some(error_msg), + diff: None, + limitation_reason: reason.map(|r| r.to_string()), } } } @@ -123,12 +205,40 @@ pub fn test_response_transformation( Some(p) => p, None => { return TransformResult { - level: ValidationLevel::Fail, + level: ValidationLevel::Skipped, error: Some(format!("Response payload not found: {}", filename)), + diff: None, + limitation_reason: None, } } }; + let payload_value: Value = match lingua::serde_json::from_slice(&payload) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Failed to parse source payload: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + let expected_universal = match source_adapter.response_to_universal(payload_value) { + Ok(u) => u, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion to universal format failed: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + let expected_universal_value = universal_response_to_value(&expected_universal); + match transform_response(payload, target_adapter.format()) { Ok(result) => { // Parse result bytes to Value for validation @@ -139,26 +249,71 @@ pub fn test_response_transformation( return TransformResult { level: ValidationLevel::Fail, error: Some(format!("Failed to parse transformed output: {}", e)), + diff: None, + limitation_reason: None, } } }; // Use response_to_universal to validate - gives detailed error info match target_adapter.response_to_universal(transformed) { - Ok(_) => TransformResult { - level: ValidationLevel::Pass, - error: None, - }, + Ok(target_universal) => { + let target_universal_value = universal_response_to_value(&target_universal); + let context = 
CompareContext::for_cross_provider( + TestCategory::Responses, + source_adapter, + target_adapter, + test_case, + ); + let roundtrip_result = compare_values( + &expected_universal_value, + &target_universal_value, + context.as_ref(), + ); + diff_to_transform_result(roundtrip_result) + } Err(e) => TransformResult { level: ValidationLevel::Fail, - error: Some(e.to_string()), + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, }, } } - Err(e) => TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("{}", e)), - }, + Err(e) => { + let error_msg = e.to_string(); + let context = CompareContext::for_cross_provider( + TestCategory::Responses, + source_adapter, + target_adapter, + test_case, + ); + // For roundtrip tests (context=None), all errors are real failures + let reason = context.as_ref().and_then(|ctx| { + ctx.is_test_case_limitation().or_else(|| { + is_expected_error( + ctx.category, + ctx.source, + ctx.target, + Some(ctx.test_case), + &error_msg, + ) + }) + }); + + let level = if reason.is_some() { + ValidationLevel::Limitation + } else { + ValidationLevel::Fail + }; + + TransformResult { + level, + error: Some(error_msg), + diff: None, + limitation_reason: reason.map(|r| r.to_string()), + } + } } } @@ -173,10 +328,12 @@ pub fn test_streaming_transformation( let payload_bytes = match load_payload(test_case, source_adapter.directory_name(), filename) { Some(p) => p, None => { - // No streaming file - report as not found + // No streaming file - skip this test return TransformResult { - level: ValidationLevel::Fail, + level: ValidationLevel::Skipped, error: Some(format!("Streaming payload not found: {}", filename)), + diff: None, + limitation_reason: None, }; } }; @@ -188,6 +345,8 @@ pub fn test_streaming_transformation( return TransformResult { level: ValidationLevel::Fail, error: Some(format!("Failed to parse streaming payload: {}", e)), + diff: None, + limitation_reason: None, }; } }; @@ -198,27 +357,24 @@ pub fn test_streaming_transformation( return TransformResult { level: ValidationLevel::Fail, error: Some("Streaming payload is not an array".to_string()), + diff: None, + limitation_reason: None, }; } }; // Test all events - fail if any event fails for (idx, event) in events.iter().enumerate() { - // Serialize each event back to bytes for the transform function - let event_bytes = match lingua::serde_json::to_vec(event) { - Ok(b) => Bytes::from(b), - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Event {}: failed to serialize: {}", idx, e)), - }; - } - }; - - if let Err(e) = test_single_stream_event(event_bytes, target_adapter) { + let result = test_single_stream_event(event, source_adapter, target_adapter, test_case); + if result.level != ValidationLevel::Pass { return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Event {}: {}", idx, e)), + level: result.level, + error: result + .error + .map(|e| format!("Event {}: {}", idx, e)) + .or(Some(format!("Event {} failed", idx))), + diff: result.diff, + limitation_reason: result.limitation_reason, }; } } @@ -226,42 +382,129 @@ pub fn test_streaming_transformation( TransformResult { level: ValidationLevel::Pass, error: None, + diff: None, + limitation_reason: None, } } /// Test a single streaming event transformation fn test_single_stream_event( - event: Bytes, + event: &Value, + source_adapter: &dyn ProviderAdapter, target_adapter: &dyn ProviderAdapter, -) -> Result<(), String> { + 
test_case: &str, +) -> TransformResult { + let source_universal = match source_adapter.stream_to_universal(event.clone()) { + Ok(u) => u, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion to universal format failed: {}", e)), + diff: None, + limitation_reason: None, + } + } + }; + + // Serialize each event back to bytes for the transform function + let event_bytes = match lingua::serde_json::to_vec(event) { + Ok(b) => Bytes::from(b), + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("failed to serialize: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + // Transform the event to target format - let result = - transform_stream_chunk(event, target_adapter.format()).map_err(|e| e.to_string())?; + let result = match transform_stream_chunk(event_bytes, target_adapter.format()) { + Ok(r) => r, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(e.to_string()), + diff: None, + limitation_reason: None, + } + } + }; // Parse result bytes to Value for validation let output_bytes = result.into_bytes(); - let transformed: Value = - lingua::serde_json::from_slice(&output_bytes).map_err(|e| e.to_string())?; + let transformed: Value = match lingua::serde_json::from_slice(&output_bytes) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(e.to_string()), + diff: None, + limitation_reason: None, + } + } + }; // Validate transformed output can be parsed by target adapter - match target_adapter.stream_to_universal(transformed) { - Ok(Some(_chunk)) => Ok(()), - Ok(None) => Ok(()), // Keep-alive events are valid - Err(e) => Err(e.to_string()), + let target_universal = match target_adapter.stream_to_universal(transformed) { + Ok(u) => u, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, + } + } + }; + + let context = CompareContext::for_cross_provider( + TestCategory::Streaming, + source_adapter, + target_adapter, + test_case, + ); + + match (source_universal, target_universal) { + (None, None) => TransformResult { + level: ValidationLevel::Pass, + error: None, + diff: None, + limitation_reason: None, + }, + (Some(source_chunk), Some(target_chunk)) => { + let source_value = universal_stream_to_value(&source_chunk); + let target_value = universal_stream_to_value(&target_chunk); + let roundtrip_result = compare_values(&source_value, &target_value, context.as_ref()); + diff_to_transform_result(roundtrip_result) + } + (source, target) => { + let source_value = source + .as_ref() + .map(universal_stream_to_value) + .unwrap_or(Value::Null); + let target_value = target + .as_ref() + .map(universal_stream_to_value) + .unwrap_or(Value::Null); + let roundtrip_result = compare_values(&source_value, &target_value, context.as_ref()); + diff_to_transform_result(roundtrip_result) + } } } /// Run all cross-transformation tests and collect results -pub fn run_all_tests(adapters: &[Box]) -> AllResults { - let test_cases = discover_test_cases(); +pub fn run_all_tests(adapters: &[Box], filter: &TestFilter) -> AllResults { + let test_cases = discover_test_cases_filtered(filter); let mut request_results: PairResults = HashMap::new(); let mut response_results: PairResults = HashMap::new(); let mut streaming_results: PairResults = HashMap::new(); - // Initialize results for all pairs - for 
(source_idx, _) in adapters.iter().enumerate() { - for (target_idx, _) in adapters.iter().enumerate() { - if source_idx != target_idx { + // Initialize results for all pairs that match the filter (including self-pairs for roundtrip) + for (source_idx, source_adapter) in adapters.iter().enumerate() { + for (target_idx, target_adapter) in adapters.iter().enumerate() { + if filter.matches_provider_pair(source_adapter.format(), target_adapter.format()) { request_results.insert((source_idx, target_idx), PairResult::default()); response_results.insert((source_idx, target_idx), PairResult::default()); streaming_results.insert((source_idx, target_idx), PairResult::default()); @@ -269,11 +512,12 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { } } - // Test each source→target pair for each test case + // Test each source→target pair for each test case (including self-pairs for roundtrip) for test_case in &test_cases { for (source_idx, source) in adapters.iter().enumerate() { for (target_idx, target) in adapters.iter().enumerate() { - if source_idx == target_idx { + // Skip pairs that don't match the filter + if !filter.matches_provider_pair(source.format(), target.format()) { continue; } @@ -285,67 +529,59 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { let pair_result = request_results.get_mut(&(source_idx, target_idx)).unwrap(); match result.level { + ValidationLevel::Skipped => { /* do nothing */ } ValidationLevel::Pass => pair_result.passed += 1, ValidationLevel::Fail => { pair_result.failed += 1; - if let Some(error) = result.error { - pair_result - .failures - .push((format!("{} (request)", test_case), error)); - } + let error = result.error.unwrap_or_else(|| "Unknown error".to_string()); + pair_result.failures.push(( + format!("{} (request)", test_case), + error, + result.diff, + )); } ValidationLevel::Limitation => { pair_result.limitations += 1; - if let Some(error) = result.error { - pair_result - .limitation_details - .push((format!("{} (request)", test_case), error)); - } - } - ValidationLevel::MissingFixture => { - pair_result.missing_fixtures += 1; - if let Some(error) = result.error { - pair_result - .missing_fixture_details - .push((format!("{} (request)", test_case), error)); - } + let detail = result + .limitation_reason + .or(result.error) + .unwrap_or_else(|| "Unknown limitation".to_string()); + pair_result.limitation_details.push(( + format!("{} (request)", test_case), + detail, + result.diff, + )); } } // Test followup request if exists let followup_result = test_request_transformation(test_case, source, target, "followup-request.json"); - if followup_result - .error - .as_ref() - .is_none_or(|e| !e.contains("not found")) - { - match followup_result.level { - ValidationLevel::Pass => pair_result.passed += 1, - ValidationLevel::Fail => { - pair_result.failed += 1; - if let Some(error) = followup_result.error { - pair_result - .failures - .push((format!("{} (followup)", test_case), error)); - } - } - ValidationLevel::Limitation => { - pair_result.limitations += 1; - if let Some(error) = followup_result.error { - pair_result - .limitation_details - .push((format!("{} (followup)", test_case), error)); - } - } - ValidationLevel::MissingFixture => { - pair_result.missing_fixtures += 1; - if let Some(error) = followup_result.error { - pair_result - .missing_fixture_details - .push((format!("{} (followup)", test_case), error)); - } - } + match followup_result.level { + ValidationLevel::Skipped => { /* do nothing */ } + ValidationLevel::Pass => pair_result.passed += 
1, + ValidationLevel::Fail => { + pair_result.failed += 1; + let error = followup_result + .error + .unwrap_or_else(|| "Unknown error".to_string()); + pair_result.failures.push(( + format!("{} (followup)", test_case), + error, + followup_result.diff, + )); + } + ValidationLevel::Limitation => { + pair_result.limitations += 1; + let detail = followup_result + .limitation_reason + .or(followup_result.error) + .unwrap_or_else(|| "Unknown limitation".to_string()); + pair_result.limitation_details.push(( + format!("{} (followup)", test_case), + detail, + followup_result.diff, + )); } } @@ -354,37 +590,31 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { test_response_transformation(test_case, source, target, "response.json"); let resp_pair_result = response_results.get_mut(&(source_idx, target_idx)).unwrap(); - if response_result - .error - .as_ref() - .is_none_or(|e| !e.contains("not found")) - { - match response_result.level { - ValidationLevel::Pass => resp_pair_result.passed += 1, - ValidationLevel::Fail => { - resp_pair_result.failed += 1; - if let Some(error) = response_result.error { - resp_pair_result - .failures - .push((format!("{} (response)", test_case), error)); - } - } - ValidationLevel::Limitation => { - resp_pair_result.limitations += 1; - if let Some(error) = response_result.error { - resp_pair_result - .limitation_details - .push((format!("{} (response)", test_case), error)); - } - } - ValidationLevel::MissingFixture => { - resp_pair_result.missing_fixtures += 1; - if let Some(error) = response_result.error { - resp_pair_result - .missing_fixture_details - .push((format!("{} (response)", test_case), error)); - } - } + match response_result.level { + ValidationLevel::Skipped => { /* do nothing */ } + ValidationLevel::Pass => resp_pair_result.passed += 1, + ValidationLevel::Fail => { + resp_pair_result.failed += 1; + let error = response_result + .error + .unwrap_or_else(|| "Unknown error".to_string()); + resp_pair_result.failures.push(( + format!("{} (response)", test_case), + error, + response_result.diff, + )); + } + ValidationLevel::Limitation => { + resp_pair_result.limitations += 1; + let detail = response_result + .limitation_reason + .or(response_result.error) + .unwrap_or_else(|| "Unknown limitation".to_string()); + resp_pair_result.limitation_details.push(( + format!("{} (response)", test_case), + detail, + response_result.diff, + )); } } @@ -399,37 +629,31 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { target, "response-streaming.json", ); - if streaming_result - .error - .as_ref() - .is_none_or(|e| !e.contains("not found")) - { - match streaming_result.level { - ValidationLevel::Pass => stream_pair_result.passed += 1, - ValidationLevel::Fail => { - stream_pair_result.failed += 1; - if let Some(error) = streaming_result.error { - stream_pair_result - .failures - .push((format!("{} (streaming)", test_case), error)); - } - } - ValidationLevel::Limitation => { - stream_pair_result.limitations += 1; - if let Some(error) = streaming_result.error { - stream_pair_result - .limitation_details - .push((format!("{} (streaming)", test_case), error)); - } - } - ValidationLevel::MissingFixture => { - stream_pair_result.missing_fixtures += 1; - if let Some(error) = streaming_result.error { - stream_pair_result - .missing_fixture_details - .push((format!("{} (streaming)", test_case), error)); - } - } + match streaming_result.level { + ValidationLevel::Skipped => { /* do nothing */ } + ValidationLevel::Pass => stream_pair_result.passed += 1, + ValidationLevel::Fail 
=> { + stream_pair_result.failed += 1; + let error = streaming_result + .error + .unwrap_or_else(|| "Unknown error".to_string()); + stream_pair_result.failures.push(( + format!("{} (streaming)", test_case), + error, + streaming_result.diff, + )); + } + ValidationLevel::Limitation => { + stream_pair_result.limitations += 1; + let detail = streaming_result + .limitation_reason + .or(streaming_result.error) + .unwrap_or_else(|| "Unknown limitation".to_string()); + stream_pair_result.limitation_details.push(( + format!("{} (streaming)", test_case), + detail, + streaming_result.diff, + )); } } @@ -440,37 +664,31 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { target, "followup-response-streaming.json", ); - if followup_streaming_result - .error - .as_ref() - .is_none_or(|e| !e.contains("not found")) - { - match followup_streaming_result.level { - ValidationLevel::Pass => stream_pair_result.passed += 1, - ValidationLevel::Fail => { - stream_pair_result.failed += 1; - if let Some(error) = followup_streaming_result.error { - stream_pair_result - .failures - .push((format!("{} (followup-streaming)", test_case), error)); - } - } - ValidationLevel::Limitation => { - stream_pair_result.limitations += 1; - if let Some(error) = followup_streaming_result.error { - stream_pair_result - .limitation_details - .push((format!("{} (followup-streaming)", test_case), error)); - } - } - ValidationLevel::MissingFixture => { - stream_pair_result.missing_fixtures += 1; - if let Some(error) = followup_streaming_result.error { - stream_pair_result - .missing_fixture_details - .push((format!("{} (followup-streaming)", test_case), error)); - } - } + match followup_streaming_result.level { + ValidationLevel::Skipped => { /* do nothing */ } + ValidationLevel::Pass => stream_pair_result.passed += 1, + ValidationLevel::Fail => { + stream_pair_result.failed += 1; + let error = followup_streaming_result + .error + .unwrap_or_else(|| "Unknown error".to_string()); + stream_pair_result.failures.push(( + format!("{} (followup-streaming)", test_case), + error, + followup_streaming_result.diff, + )); + } + ValidationLevel::Limitation => { + stream_pair_result.limitations += 1; + let detail = followup_streaming_result + .limitation_reason + .or(followup_streaming_result.error) + .unwrap_or_else(|| "Unknown limitation".to_string()); + stream_pair_result.limitation_details.push(( + format!("{} (followup-streaming)", test_case), + detail, + followup_streaming_result.diff, + )); } } } @@ -484,34 +702,117 @@ pub fn run_all_tests(adapters: &[Box]) -> AllResults { // Roundtrip testing (Provider → Universal → Provider) // ============================================================================ -use crate::types::{ProviderRoundtripResult, RoundtripDiff, RoundtripResult}; +use crate::expected::{is_expected_error, is_expected_field, is_expected_test_case}; +use crate::types::{RoundtripDiff, RoundtripResult}; use std::collections::HashSet; -/// Type alias for roundtrip results indexed by adapter index -pub type RoundtripResults = HashMap; +/// Context for value comparison, carrying provider names for expected-difference filtering. +struct CompareContext<'a> { + category: TestCategory, + source: &'a str, + target: &'a str, + test_case: &'a str, +} -/// Fields that are expected to change during roundtrip and should be ignored. -/// These are typically metadata fields set by providers or computed values. 
-const IGNORED_FIELDS: &[&str] = &[ - "id", - "created", - "system_fingerprint", - "service_tier", - "object", -]; +impl<'a> CompareContext<'a> { + fn new(category: TestCategory, source: &'a str, target: &'a str, test_case: &'a str) -> Self { + Self { + category, + source, + target, + test_case, + } + } + + /// Create context for cross-provider comparison, or None for roundtrip tests. + /// Roundtrip tests (source == target) don't use expected differences because + /// any data loss in Format→Universal→Format is a real bug, not a "limitation". + fn for_cross_provider( + category: TestCategory, + source_adapter: &'a dyn ProviderAdapter, + target_adapter: &'a dyn ProviderAdapter, + test_case: &'a str, + ) -> Option { + if source_adapter.format() == target_adapter.format() { + None + } else { + Some(Self::new( + category, + source_adapter.display_name(), + target_adapter.display_name(), + test_case, + )) + } + } + + /// Check if this entire test case is an expected limitation. + fn is_test_case_limitation(&self) -> Option { + is_expected_test_case(self.category, self.source, self.target, self.test_case) + } + + /// Check if a field difference is expected for this source→target translation. + /// Returns the reason if expected, None otherwise. + fn is_expected(&self, field: &str) -> Option { + is_expected_field( + self.category, + self.source, + self.target, + Some(self.test_case), + field, + ) + } +} /// Compare two JSON values and produce a RoundtripDiff. -fn compare_values(original: &Value, roundtripped: &Value) -> RoundtripResult { +/// +/// When `context` is provided, expected differences (based on source/target provider) +/// are filtered out and tracked as limitations. When `context` is None, all differences are reported. +fn compare_values( + original: &Value, + roundtripped: &Value, + context: Option<&CompareContext>, +) -> RoundtripResult { + // Check if entire test case is a known limitation (coarsest check) + let test_case_limitation = context.and_then(|ctx| ctx.is_test_case_limitation()); + + // Always run comparison to capture the actual diffs let mut diff = RoundtripDiff::default(); - compare_recursive(original, roundtripped, "", &mut diff); - - if diff.is_empty() { - RoundtripResult { - level: ValidationLevel::Pass, - error: None, - diff: None, + compare_recursive(original, roundtripped, "", &mut diff, context); + + // If this is a test-case-level limitation, move all diffs to expected_diffs + if let Some(reason) = &test_case_limitation { + // Move lost fields to expected_diffs + for field in diff.lost_fields.drain(..) { + diff.expected_diffs.push(( + field, + "(had value)".to_string(), + "(missing)".to_string(), + reason.clone(), + )); } - } else { + // Move added fields to expected_diffs + for field in diff.added_fields.drain(..) { + diff.expected_diffs.push(( + field, + "(missing)".to_string(), + "(has value)".to_string(), + reason.clone(), + )); + } + // Move changed fields to expected_diffs + for (field, before, after) in diff.changed_fields.drain(..) 
{ + diff.expected_diffs + .push((field, before, after, reason.clone())); + } + } + + let has_real_diffs = !diff.lost_fields.is_empty() + || !diff.added_fields.is_empty() + || !diff.changed_fields.is_empty(); + let has_expected_diffs = !diff.expected_diffs.is_empty(); + + if has_real_diffs { + // Real failures - report as Fail RoundtripResult { level: ValidationLevel::Fail, error: Some(format!( @@ -522,11 +823,38 @@ fn compare_values(original: &Value, roundtripped: &Value) -> RoundtripResult { )), diff: Some(diff), } + } else if has_expected_diffs { + // Only expected differences - report as Limitation + let error_msg = if let Some(reason) = test_case_limitation { + format!("Expected limitation: {}", reason) + } else { + format!("{} expected limitation(s)", diff.expected_diffs.len()) + }; + RoundtripResult { + level: ValidationLevel::Limitation, + error: Some(error_msg), + diff: Some(diff), + } + } else { + // No differences at all - Pass + RoundtripResult { + level: ValidationLevel::Pass, + error: None, + diff: None, + } } } /// Recursively compare two JSON values and accumulate differences. -fn compare_recursive(original: &Value, roundtripped: &Value, path: &str, diff: &mut RoundtripDiff) { +/// +/// When `context` is provided, expected differences are filtered out. +fn compare_recursive( + original: &Value, + roundtripped: &Value, + path: &str, + diff: &mut RoundtripDiff, + context: Option<&CompareContext>, +) { match (original, roundtripped) { (Value::Object(orig), Value::Object(round)) => { let orig_keys: HashSet<_> = orig.keys().collect(); @@ -539,8 +867,17 @@ fn compare_recursive(original: &Value, roundtripped: &Value, path: &str, diff: & } else { format!("{}.{}", path, key) }; - // Skip ignored fields - if !IGNORED_FIELDS.contains(&key.as_str()) { + // Track expected differences as limitations + if let Some(reason) = context.and_then(|ctx| ctx.is_expected(&field_path)) { + let before = lingua::serde_json::to_string(&orig[*key]) + .unwrap_or_else(|_| "?".to_string()); + diff.expected_diffs.push(( + field_path, + before, + "(missing)".to_string(), + reason.to_string(), + )); + } else { diff.lost_fields.push(field_path); } } @@ -552,8 +889,17 @@ fn compare_recursive(original: &Value, roundtripped: &Value, path: &str, diff: & } else { format!("{}.{}", path, key) }; - // Skip ignored fields - if !IGNORED_FIELDS.contains(&key.as_str()) { + // Track expected differences as limitations + if let Some(reason) = context.and_then(|ctx| ctx.is_expected(&field_path)) { + let after = lingua::serde_json::to_string(&round[*key]) + .unwrap_or_else(|_| "?".to_string()); + diff.expected_diffs.push(( + field_path, + "(missing)".to_string(), + after, + reason.to_string(), + )); + } else { diff.added_fields.push(field_path); } } @@ -565,24 +911,35 @@ fn compare_recursive(original: &Value, roundtripped: &Value, path: &str, diff: & } else { format!("{}.{}", path, key) }; - compare_recursive(&orig[*key], &round[*key], &new_path, diff); + compare_recursive(&orig[*key], &round[*key], &new_path, diff, context); } } (Value::Array(orig), Value::Array(round)) => { // Compare array lengths if orig.len() != round.len() { - diff.changed_fields.push(( - format!("{}.length", path), - orig.len().to_string(), - round.len().to_string(), - )); + let len_path = format!("{}.length", path); + // Track expected differences as limitations + if let Some(reason) = context.and_then(|ctx| ctx.is_expected(&len_path)) { + diff.expected_diffs.push(( + len_path, + orig.len().to_string(), + round.len().to_string(), + reason.to_string(), 
+ )); + } else { + diff.changed_fields.push(( + len_path, + orig.len().to_string(), + round.len().to_string(), + )); + } return; } // Compare element by element for (idx, (o, r)) in orig.iter().zip(round.iter()).enumerate() { let new_path = format!("{}[{}]", path, idx); - compare_recursive(o, r, &new_path, diff); + compare_recursive(o, r, &new_path, diff, context); } } (Value::Null, Value::Null) => {} @@ -590,181 +947,17 @@ fn compare_recursive(original: &Value, roundtripped: &Value, path: &str, diff: & (Value::Number(o), Value::Number(r)) if o == r => {} (Value::String(o), Value::String(r)) if o == r => {} _ => { - // Values differ - skip if this is an ignored field - let field_name = path.rsplit('.').next().unwrap_or(path); - if !IGNORED_FIELDS.contains(&field_name) { - diff.changed_fields.push(( - path.to_string(), - lingua::serde_json::to_string(original).unwrap_or_else(|_| "?".to_string()), - lingua::serde_json::to_string(roundtripped).unwrap_or_else(|_| "?".to_string()), - )); + // Values differ - track expected differences as limitations + let before = + lingua::serde_json::to_string(original).unwrap_or_else(|_| "?".to_string()); + let after = + lingua::serde_json::to_string(roundtripped).unwrap_or_else(|_| "?".to_string()); + if let Some(reason) = context.and_then(|ctx| ctx.is_expected(path)) { + diff.expected_diffs + .push((path.to_string(), before, after, reason.to_string())); + } else { + diff.changed_fields.push((path.to_string(), before, after)); } } } } - -/// Test request roundtrip: Provider → Universal → Provider -pub fn test_request_roundtrip( - test_case: &str, - adapter: &dyn ProviderAdapter, - filename: &str, -) -> Option { - // 1. Load payload - let payload = load_payload(test_case, adapter.directory_name(), filename)?; - - // 2. Parse to Value - let original: Value = match lingua::serde_json::from_slice(&payload) { - Ok(v) => v, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("Failed to parse payload: {}", e)), - diff: None, - }); - } - }; - - // 3. Convert to Universal - let universal = match adapter.request_to_universal(original.clone()) { - Ok(u) => u, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("request_to_universal failed: {}", e)), - diff: None, - }); - } - }; - - // 4. Convert back to provider format - let roundtripped = match adapter.request_from_universal(&universal) { - Ok(r) => r, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("request_from_universal failed: {}", e)), - diff: None, - }); - } - }; - - // 5. Compare original vs roundtripped - Some(compare_values(&original, &roundtripped)) -} - -/// Test response roundtrip: Provider → Universal → Provider -pub fn test_response_roundtrip( - test_case: &str, - adapter: &dyn ProviderAdapter, - filename: &str, -) -> Option { - // 1. Load payload - let payload = load_payload(test_case, adapter.directory_name(), filename)?; - - // 2. Parse to Value - let original: Value = match lingua::serde_json::from_slice(&payload) { - Ok(v) => v, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("Failed to parse payload: {}", e)), - diff: None, - }); - } - }; - - // 3. 
Convert to Universal - let universal = match adapter.response_to_universal(original.clone()) { - Ok(u) => u, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("response_to_universal failed: {}", e)), - diff: None, - }); - } - }; - - // 4. Convert back to provider format - let roundtripped = match adapter.response_from_universal(&universal) { - Ok(r) => r, - Err(e) => { - return Some(RoundtripResult { - level: ValidationLevel::Fail, - error: Some(format!("response_from_universal failed: {}", e)), - diff: None, - }); - } - }; - - // 5. Compare original vs roundtripped - Some(compare_values(&original, &roundtripped)) -} - -/// Run all roundtrip tests for all providers. -pub fn run_roundtrip_tests(adapters: &[Box]) -> RoundtripResults { - let test_cases = discover_test_cases(); - let mut results: RoundtripResults = HashMap::new(); - - // Initialize results for each adapter - for (adapter_idx, _) in adapters.iter().enumerate() { - results.insert(adapter_idx, ProviderRoundtripResult::default()); - } - - // Test each provider's roundtrip for each test case - for test_case in &test_cases { - for (adapter_idx, adapter) in adapters.iter().enumerate() { - let adapter = adapter.as_ref(); - let provider_result = results.get_mut(&adapter_idx).unwrap(); - - // Test request roundtrip - if let Some(result) = test_request_roundtrip(test_case, adapter, "request.json") { - match result.level { - ValidationLevel::Pass => provider_result.request_passed += 1, - ValidationLevel::Fail - | ValidationLevel::Limitation - | ValidationLevel::MissingFixture => { - provider_result.request_failed += 1; - provider_result - .request_failures - .push((format!("{} (request)", test_case), result)); - } - } - } - - // Test followup request roundtrip if exists - if let Some(result) = - test_request_roundtrip(test_case, adapter, "followup-request.json") - { - match result.level { - ValidationLevel::Pass => provider_result.request_passed += 1, - ValidationLevel::Fail - | ValidationLevel::Limitation - | ValidationLevel::MissingFixture => { - provider_result.request_failed += 1; - provider_result - .request_failures - .push((format!("{} (followup-request)", test_case), result)); - } - } - } - - // Test response roundtrip - if let Some(result) = test_response_roundtrip(test_case, adapter, "response.json") { - match result.level { - ValidationLevel::Pass => provider_result.response_passed += 1, - ValidationLevel::Fail - | ValidationLevel::Limitation - | ValidationLevel::MissingFixture => { - provider_result.response_failed += 1; - provider_result - .response_failures - .push((format!("{} (response)", test_case), result)); - } - } - } - } - } - - results -} diff --git a/crates/coverage-report/src/streaming_expected_differences.json b/crates/coverage-report/src/streaming_expected_differences.json new file mode 100644 index 00000000..897a4f09 --- /dev/null +++ b/crates/coverage-report/src/streaming_expected_differences.json @@ -0,0 +1,62 @@ +{ + "global": [ + { + "source": "*", + "target": "*", + "fields": [ + { "pattern": "created", "reason": "Provider-set timestamp with inconsistent field names (OpenAI: 'created', Responses: 'created_at', Anthropic: none)" }, + { "pattern": "service_tier", "reason": "OpenAI-specific billing tier not present in other providers" }, + { "pattern": "system_fingerprint", "reason": "OpenAI-specific system identifier not universal" }, + { "pattern": "messages[*].id", "reason": "Message/response IDs vary by provider and represent different concepts" } + ] + }, 
+    {
+      "source": "Anthropic",
+      "target": "*",
+      "fields": [
+        { "pattern": "usage.prompt_cache_creation_tokens", "reason": "Only Anthropic reports cache creation tokens" }
+      ]
+    },
+    {
+      "source": "Responses",
+      "target": "*",
+      "fields": [
+        { "pattern": "usage.prompt_tokens", "reason": "Responses API sends usage at end, other providers expect it at start" },
+        { "pattern": "usage.completion_tokens", "reason": "Responses API sends usage at end, other providers expect it at start" }
+      ]
+    },
+    {
+      "source": "ChatCompletions",
+      "target": "*",
+      "fields": [
+        { "pattern": "choices[*].delta.refusal", "reason": "ChatCompletions refusal field has no equivalent in other providers" },
+        { "pattern": "choices[*].delta.tool_calls", "reason": "Streaming tool_calls transformation not yet implemented" }
+      ]
+    },
+    {
+      "source": "*",
+      "target": "Bedrock",
+      "fields": [
+        { "pattern": "model", "reason": "Bedrock streaming format doesn't include model in events" }
+      ]
+    }
+  ],
+  "perTestCase": [
+    {
+      "testCase": "toolCallRequest",
+      "source": "ChatCompletions",
+      "target": "*",
+      "fields": [
+        { "pattern": "choices[*].delta.content", "reason": "ChatCompletions sends null content when tool_calls are present; not preserved in transformation" }
+      ]
+    },
+    {
+      "testCase": "toolChoiceRequiredParam",
+      "source": "ChatCompletions",
+      "target": "*",
+      "fields": [
+        { "pattern": "choices[*].delta.content", "reason": "ChatCompletions sends null content when tool_calls are present; not preserved in transformation" }
+      ]
+    }
+  ]
+}
diff --git a/crates/coverage-report/src/types.rs b/crates/coverage-report/src/types.rs
index a4f1061e..078ef786 100644
--- a/crates/coverage-report/src/types.rs
+++ b/crates/coverage-report/src/types.rs
@@ -2,20 +2,141 @@
 Type definitions for coverage-report.
 */
 
+use lingua::capabilities::ProviderFormat;
+
+/// Output format for the coverage report.
+#[derive(Debug, Clone, Copy, PartialEq, Default)]
+pub enum OutputFormat {
+    #[default]
+    Markdown,
+    Compact,
+}
+
+impl std::str::FromStr for OutputFormat {
+    type Err = String;
+
+    fn from_str(s: &str) -> Result<Self, Self::Err> {
+        match s.to_lowercase().as_str() {
+            "compact" | "c" | "token" | "t" => Ok(OutputFormat::Compact),
+            "markdown" | "md" | "full" => Ok(OutputFormat::Markdown),
+            _ => Err(format!("Unknown output format: {}", s)),
+        }
+    }
+}
+
+/// Filter configuration for granular test selection.
+#[derive(Debug, Clone, Default)]
+pub struct TestFilter {
+    /// Glob patterns to match test case names (empty = match all)
+    pub test_case_patterns: Vec<String>,
+    /// Filter both source AND target to this set of providers
+    pub providers: Option<Vec<ProviderFormat>>,
+    /// Explicit source provider filter
+    pub sources: Option<Vec<ProviderFormat>>,
+    /// Explicit target provider filter
+    pub targets: Option<Vec<ProviderFormat>>,
+}
+
+impl TestFilter {
+    /// Check if a test case name matches the filter patterns.
+    /// If no patterns specified, matches all test cases.
+    pub fn matches_test_case(&self, name: &str) -> bool {
+        if self.test_case_patterns.is_empty() {
+            return true;
+        }
+        self.test_case_patterns
+            .iter()
+            .any(|pattern| glob_match(pattern, name))
+    }
+
+    /// Check if a provider pair matches the filter.
+    /// Logic:
+    /// - If `providers` is set: both source AND target must be in the list
+    /// - If `sources` is set: source must be in the list
+    /// - If `targets` is set: target must be in the list
+    /// - Filters combine with AND logic
+    pub fn matches_provider_pair(&self, source: ProviderFormat, target: ProviderFormat) -> bool {
+        // Check providers filter (both must match)
+        if let Some(ref providers) = self.providers {
+            if !providers.contains(&source) || !providers.contains(&target) {
+                return false;
+            }
+        }
+
+        // Check explicit source filter
+        if let Some(ref sources) = self.sources {
+            if !sources.contains(&source) {
+                return false;
+            }
+        }
+
+        // Check explicit target filter
+        if let Some(ref targets) = self.targets {
+            if !targets.contains(&target) {
+                return false;
+            }
+        }
+
+        true
+    }
+}
+
+/// Simple glob pattern matching.
+/// Supports `*` (match any sequence) and `?` (match single char).
+fn glob_match(pattern: &str, text: &str) -> bool {
+    // Convert glob pattern to regex
+    let regex_pattern = pattern
+        .chars()
+        .map(|c| match c {
+            '*' => ".*".to_string(),
+            '?' => ".".to_string(),
+            // Escape regex special chars
+            '.' | '+' | '^' | '$' | '(' | ')' | '[' | ']' | '{' | '}' | '|' | '\\' => {
+                format!("\\{}", c)
+            }
+            _ => c.to_string(),
+        })
+        .collect::<String>();
+
+    // Anchor the pattern to match the entire string
+    let full_pattern = format!("^{}$", regex_pattern);
+
+    regex::Regex::new(&full_pattern)
+        .map(|re| re.is_match(text))
+        .unwrap_or(false)
+}
+
+/// Parse a provider name string into a ProviderFormat.
+pub fn parse_provider(name: &str) -> Result<ProviderFormat, String> {
+    match name.to_lowercase().as_str() {
+        "responses" | "response" | "openai-responses" => Ok(ProviderFormat::Responses),
+        "chat-completions" | "chatcompletions" | "completions" | "openai" => {
+            Ok(ProviderFormat::OpenAI)
+        }
+        "anthropic" => Ok(ProviderFormat::Anthropic),
+        "google" | "gemini" => Ok(ProviderFormat::Google),
+        "bedrock" | "converse" => Ok(ProviderFormat::Converse),
+        _ => Err(format!("Unknown provider: {}", name)),
+    }
+}
+
 #[derive(Debug, Clone, Copy, PartialEq)]
 pub enum ValidationLevel {
     Pass,
     Fail,
     /// Provider limitation - feature that can't be transformed (e.g., "has no OpenAI equivalent")
     Limitation,
-    /// Missing test fixture - "Source payload not found"
-    MissingFixture,
+    /// Test skipped (e.g., payload file not found)
+    Skipped,
 }
 
 #[derive(Debug)]
 pub struct TransformResult {
     pub level: ValidationLevel,
     pub error: Option<String>,
+    pub diff: Option<RoundtripDiff>,
+    /// Human-readable reason from expected.rs whitelist (for limitations only)
+    pub limitation_reason: Option<String>,
 }
 
 #[derive(Debug, Default)]
@@ -23,17 +144,74 @@ pub struct PairResult {
     pub passed: usize,
     pub failed: usize,
     pub limitations: usize,
-    pub missing_fixtures: usize,
-    pub failures: Vec<(String, String)>,
-    pub limitation_details: Vec<(String, String)>,
-    pub missing_fixture_details: Vec<(String, String)>,
+    /// (test_case, error_message, optional_diff)
+    pub failures: Vec<(String, String, Option<RoundtripDiff>)>,
+    /// (test_case, reason, optional_diff)
+    pub limitation_details: Vec<(String, String, Option<RoundtripDiff>)>,
 }
 
 pub struct TableStats {
     pub passed: usize,
     pub failed: usize,
     pub limitations: usize,
-    pub missing_fixtures: usize,
+}
+
+/// Failure with diff info: (direction, test_case, error, optional_diff)
+pub type FailureWithDiff = (String, String, String, Option<RoundtripDiff>);
+
+/// Output from generate_table function containing table markdown and statistics.
+pub struct TableOutput {
+    pub table_markdown: String,
+    pub stats: TableStats,
+    pub failures: Vec<FailureWithDiff>,
+    /// (direction, test_case, reason, optional_diff)
+    pub limitations: Vec<(String, String, String, Option<RoundtripDiff>)>,
+}
+
+#[derive(Debug, Clone, Copy)]
+pub struct CoverageSelection {
+    pub requests: bool,
+    pub responses: bool,
+    pub streaming: bool,
+}
+
+impl CoverageSelection {
+    pub fn all() -> Self {
+        Self {
+            requests: true,
+            responses: true,
+            streaming: true,
+        }
+    }
+
+    pub fn from_list(value: &str) -> Result<Self, String> {
+        let mut selection = Self {
+            requests: false,
+            responses: false,
+            streaming: false,
+        };
+
+        for raw in value.split(',') {
+            let token = raw.trim().to_lowercase();
+            if token.is_empty() {
+                continue;
+            }
+
+            match token.as_str() {
+                "all" => return Ok(Self::all()),
+                "requests" | "request" => selection.requests = true,
+                "responses" | "response" => selection.responses = true,
+                "streaming" | "stream" => selection.streaming = true,
+                _ => return Err(format!("Unknown coverage section: {}", token)),
+            }
+        }
+
+        if !selection.requests && !selection.responses && !selection.streaming {
+            return Err("No valid coverage sections provided".to_string());
+        }
+
+        Ok(selection)
+    }
 }
 
 /// An issue entry: (direction, test_case, error_message)
@@ -58,11 +236,13 @@ pub struct TableResult {
 /// - `lost_fields`: Fields present in original but missing after roundtrip
 /// - `added_fields`: Fields added during roundtrip (not in original)
 /// - `changed_fields`: Fields where values changed (path, original, roundtripped)
-#[derive(Debug, Default)]
+/// - `expected_diffs`: Fields that differed but are whitelisted limitations (field_path, before, after, reason)
+#[derive(Debug, Default, Clone)]
 pub struct RoundtripDiff {
     pub lost_fields: Vec<String>,
     pub added_fields: Vec<String>,
     pub changed_fields: Vec<(String, String, String)>,
+    pub expected_diffs: Vec<(String, String, String, String)>,
 }
 
 impl RoundtripDiff {
@@ -86,24 +266,58 @@ pub struct RoundtripResult {
     pub diff: Option<RoundtripDiff>,
 }
 
-/// Per-provider aggregated roundtrip test results.
-#[derive(Debug, Default)]
-pub struct ProviderRoundtripResult {
-    pub request_passed: usize,
-    pub request_failed: usize,
-    pub request_failures: Vec<(String, RoundtripResult)>,
-    pub response_passed: usize,
-    pub response_failed: usize,
-    pub response_failures: Vec<(String, RoundtripResult)>,
+// ============================================================================
+// Expected differences types
+// ============================================================================
+
+use serde::{Deserialize, Serialize};
+
+/// Root structure for expected differences with two-tier organization.
+#[derive(Debug, Clone, Deserialize, Serialize)]
+pub struct ExpectedDifferences {
+    /// Global rules that apply to all test cases for a source→target pair
+    #[serde(default)]
+    pub global: Vec<GlobalRule>,
+    /// Per-test-case rules that only apply to specific tests
+    #[serde(default, rename = "perTestCase")]
+    pub per_test_case: Vec<PerTestCaseRule>,
 }
 
-impl ProviderRoundtripResult {
-    #[allow(dead_code)]
-    pub fn total_passed(&self) -> usize {
-        self.request_passed + self.response_passed
-    }
+/// Global rule that applies to all tests for a source→target transformation.
+#[derive(Debug, Clone, Deserialize, Serialize)] +pub struct GlobalRule { + pub source: String, + pub target: String, + #[serde(default, skip_serializing_if = "Vec::is_empty")] + pub fields: Vec, + #[serde(default, skip_serializing_if = "Vec::is_empty")] + pub errors: Vec, +} - pub fn total_failed(&self) -> usize { - self.request_failed + self.response_failed - } +/// Per-test-case rule that applies only to a specific test. +#[derive(Debug, Clone, Deserialize, Serialize)] +pub struct PerTestCaseRule { + #[serde(rename = "testCase")] + pub test_case: String, + pub source: String, + pub target: String, + /// If true, entire test should be skipped + #[serde(default)] + pub skip: bool, + /// Reason for the skip or differences + #[serde(skip_serializing_if = "Option::is_none")] + pub reason: Option, + /// Field differences expected for this test + #[serde(default, skip_serializing_if = "Vec::is_empty")] + pub fields: Vec, + /// Error patterns expected for this test + #[serde(default, skip_serializing_if = "Vec::is_empty")] + pub errors: Vec, +} + +/// A single field or error pattern with explanation. +#[derive(Debug, Clone, Deserialize, Serialize)] +pub struct DifferenceEntry { + pub pattern: String, + pub reason: String, } diff --git a/crates/coverage-report/tests/cross_provider_test.rs b/crates/coverage-report/tests/cross_provider_test.rs new file mode 100644 index 00000000..31f5d5e7 --- /dev/null +++ b/crates/coverage-report/tests/cross_provider_test.rs @@ -0,0 +1,62 @@ +/*! +Integration test for cross-provider transformations. + +This test ensures that transformations between required providers have no +unexpected failures. Known limitations (documented in expected_differences.json) +are allowed, but regressions will cause this test to fail. +*/ + +use coverage_report::runner::run_all_tests; +use coverage_report::types::TestFilter; +use lingua::capabilities::ProviderFormat; +use lingua::processing::adapters::adapters; + +/// Required providers for CI: Anthropic <-> ChatCompletions <-> Responses +const REQUIRED_PROVIDERS: &[ProviderFormat] = &[ + ProviderFormat::Responses, + ProviderFormat::OpenAI, // ChatCompletions + ProviderFormat::Anthropic, +]; + +#[test] +fn cross_provider_transformations_have_no_unexpected_failures() { + let adapters = adapters(); + let filter = TestFilter { + providers: Some(REQUIRED_PROVIDERS.to_vec()), + ..Default::default() + }; + + let (request_results, response_results, streaming_results) = run_all_tests(adapters, &filter); + + let mut failures = Vec::new(); + + // Collect failures from all result categories + for (category, results) in [ + ("requests", &request_results), + ("responses", &response_results), + ("streaming", &streaming_results), + ] { + for ((src_idx, tgt_idx), pair_result) in results.iter() { + if pair_result.failed > 0 { + let src_format = adapters[*src_idx].format(); + let tgt_format = adapters[*tgt_idx].format(); + + // Collect detailed failure messages + for (test_case, error, _diff) in &pair_result.failures { + failures.push(format!( + " [{category}] {:?} -> {:?}: {test_case}\n Error: {error}", + src_format, tgt_format + )); + } + } + } + } + + assert!( + failures.is_empty(), + "Unexpected cross-provider transformation failures:\n\n{}\n\n\ + These failures are NOT in the expected_differences.json whitelist.\n\ + Either fix the regression or add an entry to the appropriate *_expected_differences.json file.", + failures.join("\n\n") + ); +} diff --git a/crates/generate-types/src/main.rs b/crates/generate-types/src/main.rs index 
725d4131..f9dca1b9 100644 --- a/crates/generate-types/src/main.rs +++ b/crates/generate-types/src/main.rs @@ -1180,15 +1180,11 @@ fn add_ts_type_annotations(content: &str) -> String { /// Add #[serde(skip_serializing_if = "Option::is_none")] to all Option fields fn add_serde_skip_if_none(content: &str) -> String { - let processed = content.to_string(); - - // Use regex-like approach to find Option fields and add serde attributes - let lines: Vec<&str> = processed.lines().collect(); + let lines: Vec<&str> = content.lines().collect(); let mut result_lines = Vec::new(); for i in 0..lines.len() { let line = lines[i]; - result_lines.push(line.to_string()); // Check if this line contains a pub field with Option (but not nested Options) if line.trim_start().starts_with("pub ") && line.ends_with(",") { @@ -1197,22 +1193,23 @@ fn add_serde_skip_if_none(content: &str) -> String { if field_parts.len() >= 3 { let field_type = field_parts[2].trim_end_matches(','); if field_type.starts_with("Option<") { - // Check if the next line already has a serde attribute - let next_line = lines.get(i + 1).map(|l| l.trim()).unwrap_or(""); - if !next_line.starts_with("#[serde(") && !line.contains("#[serde(") { + // FIX: Check if the PREVIOUS line already has the skip_serializing_if attribute + // Serde attributes come BEFORE the field they annotate + let prev_line = if i > 0 { lines[i - 1].trim() } else { "" }; + if !prev_line.contains("skip_serializing_if") { // Get the indentation level from the current line let indent = line.len() - line.trim_start().len(); let serde_attr = format!( "{}#[serde(skip_serializing_if = \"Option::is_none\")]", " ".repeat(indent) ); - - // Insert the serde attribute before the field - result_lines.insert(result_lines.len() - 1, serde_attr); + result_lines.push(serde_attr); } } } } + + result_lines.push(line.to_string()); } result_lines.join("\n") diff --git a/crates/lingua/src/error.rs b/crates/lingua/src/error.rs index 8870696e..1bd3f3a9 100644 --- a/crates/lingua/src/error.rs +++ b/crates/lingua/src/error.rs @@ -9,12 +9,22 @@ pub enum ConvertError { #[error("Missing required field: {field}")] MissingRequiredField { field: String }, - #[error("Invalid role: {role}")] - InvalidRole { role: String }, - #[error("Content conversion failed: {reason}")] ContentConversionFailed { reason: String }, #[error("JSON serialization failed for field '{field}': {error}")] JsonSerializationFailed { field: String, error: String }, + + #[error("Invalid {type_name} value: '{value}'")] + InvalidEnumValue { + type_name: &'static str, + value: String, + }, + + #[error("Tool '{tool_name}' of type '{tool_type}' is not supported by {target_provider}")] + UnsupportedToolType { + tool_name: String, + tool_type: String, + target_provider: String, + }, } diff --git a/crates/lingua/src/processing/adapters.rs b/crates/lingua/src/processing/adapters.rs index 11ff3eae..f7bf1eb7 100644 --- a/crates/lingua/src/processing/adapters.rs +++ b/crates/lingua/src/processing/adapters.rs @@ -12,19 +12,53 @@ provider-specific logic into a single interface. 3. Register it in `adapters()` with the appropriate feature gate */ +/// Macro to reject unsupported parameters in provider adapters. +/// +/// This macro reduces boilerplate when validating that a UniversalRequest doesn't +/// contain parameters that a provider doesn't support. 
+/// +/// # Example +/// +/// ```ignore +/// reject_params!(req, ProviderFormat::Anthropic, +/// logprobs, +/// top_logprobs, +/// presence_penalty, +/// frequency_penalty, +/// seed, +/// store +/// ); +/// ``` +/// +/// This expands to individual checks for each field, returning a ValidationFailed +/// error if any unsupported field is present. +#[macro_export] +macro_rules! reject_params { + ($req:expr, $target:expr, $($field:ident),+ $(,)?) => { + $( + if $req.params.$field.is_some() { + return Err($crate::processing::transform::TransformError::ValidationFailed { + target: $target, + reason: concat!("does not support ", stringify!($field)).to_string(), + }); + } + )+ + }; +} + use std::sync::LazyLock; use crate::capabilities::ProviderFormat; use crate::processing::transform::TransformError; use crate::serde_json::{Map, Number, Value}; -use crate::universal::{FinishReason, UniversalRequest, UniversalResponse, UniversalStreamChunk}; +use crate::universal::{UniversalRequest, UniversalResponse, UniversalStreamChunk}; /// Trait for provider-specific request and response handling. /// /// Implementations handle: /// - Format detection for both requests and responses /// - Conversion to/from universal request/response format -/// - Provider-specific defaults and finish reason mapping +/// - Provider-specific defaults pub trait ProviderAdapter: Send + Sync { // ========================================================================= // Metadata @@ -59,12 +93,6 @@ pub trait ProviderAdapter: Send + Sync { /// This builds a complete request payload in the provider's format. fn request_from_universal(&self, req: &UniversalRequest) -> Result; - /// Apply provider-specific defaults to a universal request. - /// - /// This is called after conversion but before building the final payload. - /// For example, Anthropic requires `max_tokens` to be set. - fn apply_defaults(&self, req: &mut UniversalRequest); - // ========================================================================= // Response handling // ========================================================================= @@ -82,13 +110,15 @@ pub trait ProviderAdapter: Send + Sync { /// This builds a complete response payload in the provider's format. fn response_from_universal(&self, resp: &UniversalResponse) -> Result; - /// Map a universal FinishReason to provider-specific string. + /// Apply provider-specific defaults to a universal request. /// - /// Each provider uses different strings for finish reasons: - /// - OpenAI: "stop", "length", "tool_calls", "content_filter" - /// - Anthropic: "end_turn", "max_tokens", "tool_use" - /// - Google: "STOP", "MAX_TOKENS" - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option; + /// This is called after conversion but before building the final payload. + /// For example, Anthropic requires `max_tokens` to be set. + /// + /// Default implementation is a no-op. Override if your provider requires specific defaults. 
+ fn apply_defaults(&self, _req: &mut UniversalRequest) { + // Default: no-op - override if provider requires specific defaults + } // ========================================================================= // Streaming response handling diff --git a/crates/lingua/src/processing/import.rs b/crates/lingua/src/processing/import.rs index a794de70..127a9634 100644 --- a/crates/lingua/src/processing/import.rs +++ b/crates/lingua/src/processing/import.rs @@ -1,4 +1,5 @@ use crate::providers::anthropic::generated as anthropic; +use crate::providers::openai::convert::ChatCompletionRequestMessageExt; use crate::providers::openai::generated as openai; use crate::serde_json; use crate::serde_json::Value; @@ -82,12 +83,14 @@ fn try_converting_to_messages(data: &Value) -> Vec { }; // Try Chat Completions format (most common) + // Use extended type to capture reasoning field from vLLM/OpenRouter convention if let Ok(provider_messages) = - serde_json::from_value::>(data_to_parse.clone()) + serde_json::from_value::>(data_to_parse.clone()) { - if let Ok(messages) = as TryFromLLM< - Vec, - >>::try_from(provider_messages) + if let Ok(messages) = + as TryFromLLM>>::try_from( + provider_messages, + ) { if !messages.is_empty() { return messages; diff --git a/crates/lingua/src/processing/transform.rs b/crates/lingua/src/processing/transform.rs index aeceefd0..6c2e5e5f 100644 --- a/crates/lingua/src/processing/transform.rs +++ b/crates/lingua/src/processing/transform.rs @@ -14,6 +14,7 @@ passthrough in async contexts. use bytes::Bytes; use crate::capabilities::ProviderFormat; +use crate::error::ConvertError; use crate::processing::adapters::{adapter_for_format, adapters, ProviderAdapter}; use crate::serde_json::Value; use crate::universal::{UniversalResponse, UniversalStreamChunk}; @@ -57,6 +58,29 @@ pub enum TransformError { StreamingNotImplemented(String), } +impl TransformError { + /// Returns true if this is a client-side error (user's fault). + /// + /// Client errors indicate invalid input or unsupported configurations + /// that the user should fix in their request. + pub fn is_client_error(&self) -> bool { + matches!( + self, + TransformError::UnableToDetectFormat + | TransformError::ValidationFailed { .. } + | TransformError::DeserializationFailed(_) + | TransformError::UnsupportedTargetFormat(_) + | TransformError::UnsupportedSourceFormat(_) + ) + } +} + +impl From for TransformError { + fn from(err: ConvertError) -> Self { + TransformError::FromUniversalFailed(err.to_string()) + } +} + /// Result of a transformation operation. /// /// Contains either the original bytes (passthrough) or transformed bytes. 
@@ -213,6 +237,7 @@ pub fn transform_request( // Apply target provider defaults (e.g., Anthropic's required max_tokens) target_adapter.apply_defaults(&mut universal); + // Convert to target format (validation happens in adapter) let transformed = target_adapter.request_from_universal(&universal)?; let bytes = crate::serde_json::to_vec(&transformed) diff --git a/crates/lingua/src/providers/anthropic/adapter.rs b/crates/lingua/src/providers/anthropic/adapter.rs index 265f9a3f..32aa66b8 100644 --- a/crates/lingua/src/providers/anthropic/adapter.rs +++ b/crates/lingua/src/providers/anthropic/adapter.rs @@ -7,42 +7,31 @@ Anthropic's Messages API has some unique requirements: */ use crate::capabilities::ProviderFormat; +use crate::error::ConvertError; use crate::processing::adapters::{ - collect_extras, insert_opt_bool, insert_opt_f64, insert_opt_i64, insert_opt_value, - ProviderAdapter, + insert_opt_bool, insert_opt_f64, insert_opt_i64, ProviderAdapter, }; use crate::processing::transform::TransformError; -use crate::providers::anthropic::generated::{ContentBlock, CreateMessageParams, InputMessage}; +use crate::providers::anthropic::generated::{ContentBlock, InputMessage}; +use crate::providers::anthropic::params::AnthropicParams; use crate::providers::anthropic::try_parse_anthropic; +use crate::reject_params; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::{Message, UserContent}; +use crate::universal::reasoning::ANTHROPIC_THINKING_TEMPERATURE; +use crate::universal::tools::{tools_to_anthropic_value, UniversalTool}; use crate::universal::transform::extract_system_messages; use crate::universal::{ - FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, - UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, + parse_stop_sequences, FinishReason, UniversalParams, UniversalRequest, UniversalResponse, + UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, }; +use std::collections::HashMap; +use std::convert::TryInto; /// Default max_tokens for Anthropic requests (matches legacy proxy behavior). pub const DEFAULT_MAX_TOKENS: i64 = 4096; -/// Known request fields for Anthropic Messages API. -/// Fields not in this list go into `extras`. -const ANTHROPIC_KNOWN_KEYS: &[&str] = &[ - "model", - "messages", - "system", - "max_tokens", - "temperature", - "top_p", - "top_k", - "stop_sequences", - "stream", - "metadata", - "tools", - "tool_choice", -]; - /// Adapter for Anthropic Messages API. 
pub struct AnthropicAdapter; @@ -64,37 +53,75 @@ impl ProviderAdapter for AnthropicAdapter { } fn request_to_universal(&self, payload: Value) -> Result { - let extras = collect_extras(&payload, ANTHROPIC_KNOWN_KEYS); - let stop = payload.get("stop_sequences").cloned(); - - let request: CreateMessageParams = serde_json::from_value(payload) + // Single parse: typed params now includes typed messages via #[serde(flatten)] + let typed_params: AnthropicParams = serde_json::from_value(payload) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let messages = as TryFromLLM>>::try_from(request.messages) + // Extract typed messages (partial move - other fields remain accessible) + let input_messages = typed_params.messages.ok_or_else(|| { + TransformError::ToUniversalFailed("Anthropic: missing 'messages' field".to_string()) + })?; + + let messages = as TryFromLLM>>::try_from(input_messages) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; let params = UniversalParams { - temperature: request.temperature, - top_p: request.top_p, - top_k: request.top_k, - max_tokens: Some(request.max_tokens), - stop, - tools: request.tools.and_then(|t| serde_json::to_value(t).ok()), - tool_choice: request + temperature: typed_params.temperature, + top_p: typed_params.top_p, + top_k: typed_params.top_k, + max_tokens: typed_params.max_tokens, + stop: typed_params + .stop_sequences + .as_ref() + .and_then(parse_stop_sequences), + tools: typed_params + .tools + .as_ref() + .map(UniversalTool::from_value_array), + tool_choice: typed_params .tool_choice - .and_then(|t| serde_json::to_value(t).ok()), - response_format: None, // Anthropic doesn't use response_format + .as_ref() + .and_then(|v| (ProviderFormat::Anthropic, v).try_into().ok()), + response_format: typed_params + .output_format + .as_ref() + .and_then(|v| (ProviderFormat::Anthropic, v).try_into().ok()), seed: None, // Anthropic doesn't support seed presence_penalty: None, // Anthropic doesn't support these frequency_penalty: None, - stream: request.stream, + stream: typed_params.stream, + // Extract parallel_tool_calls from Anthropic's disable_parallel_tool_use in tool_choice + parallel_tool_calls: typed_params + .tool_choice + .as_ref() + .and_then(|tc| tc.get("disable_parallel_tool_use")) + .and_then(Value::as_bool) + .map(|disabled| !disabled), // disable_parallel_tool_use: true → parallel_tool_calls: false + reasoning: typed_params + .thinking + .as_ref() + .map(crate::universal::request::ReasoningConfig::from), + metadata: typed_params.metadata, + store: None, // Anthropic doesn't support store + service_tier: typed_params.service_tier, + logprobs: None, // Anthropic doesn't support logprobs + top_logprobs: None, // Anthropic doesn't support top_logprobs }; + // Use extras captured automatically via #[serde(flatten)] + let mut provider_extras = HashMap::new(); + if !typed_params.extras.is_empty() { + provider_extras.insert( + ProviderFormat::Anthropic, + typed_params.extras.into_iter().collect(), + ); + } + Ok(UniversalRequest { - model: Some(request.model), + model: typed_params.model, messages, params, - extras, + provider_extras, }) } @@ -104,6 +131,29 @@ impl ProviderAdapter for AnthropicAdapter { reason: "missing model".to_string(), })?; + // Validate unsupported parameters + reject_params!( + req, + ProviderFormat::Anthropic, + logprobs, + top_logprobs, + presence_penalty, + frequency_penalty, + seed, + store + ); + // Anthropic doesn't support multiple completions (n > 1) + if let Some(openai_extras) = 
req.provider_extras.get(&ProviderFormat::OpenAI) { + if let Some(n) = openai_extras.get("n").and_then(Value::as_i64) { + if n > 1 { + return Err(TransformError::ValidationFailed { + target: ProviderFormat::Anthropic, + reason: "does not support n > 1 (multiple completions)".to_string(), + }); + } + } + } + // Clone messages and extract system messages (Anthropic uses separate `system` param) let mut msgs = req.messages.clone(); let system_contents = extract_system_messages(&mut msgs); @@ -138,26 +188,85 @@ impl ProviderAdapter for AnthropicAdapter { let max_tokens = req.params.max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); obj.insert("max_tokens".into(), Value::Number(max_tokens.into())); + // Check if reasoning/thinking is enabled (needed for temperature override) + let thinking_val = req.params.reasoning_for(ProviderFormat::Anthropic); + let reasoning_enabled = thinking_val.is_some(); + // Insert other params - insert_opt_f64(&mut obj, "temperature", req.params.temperature); + // Anthropic requires temperature=1.0 when extended thinking is enabled + let temperature = if reasoning_enabled { + Some(ANTHROPIC_THINKING_TEMPERATURE) + } else { + req.params.temperature + }; + insert_opt_f64(&mut obj, "temperature", temperature); insert_opt_f64(&mut obj, "top_p", req.params.top_p); insert_opt_i64(&mut obj, "top_k", req.params.top_k); // Anthropic uses stop_sequences instead of stop - if let Some(stop) = &req.params.stop { - obj.insert("stop_sequences".into(), stop.clone()); + if let Some(ref stop) = req.params.stop { + if !stop.is_empty() { + obj.insert( + "stop_sequences".into(), + Value::Array(stop.iter().map(|s| Value::String(s.clone())).collect()), + ); + } + } + + // Convert tools to Anthropic format + if let Some(tools) = &req.params.tools { + if let Some(tools_value) = tools_to_anthropic_value(tools)? 
{ + obj.insert("tools".into(), tools_value); + } } - insert_opt_value(&mut obj, "tools", req.params.tools.clone()); - insert_opt_value(&mut obj, "tool_choice", req.params.tool_choice.clone()); + // Convert tool_choice using helper method (handles parallel_tool_calls internally) + if let Some(tool_choice_val) = req.params.tool_choice_for(ProviderFormat::Anthropic) { + obj.insert("tool_choice".into(), tool_choice_val); + } insert_opt_bool(&mut obj, "stream", req.params.stream); - // Merge extras - only include Anthropic-known fields - // This filters out OpenAI-specific fields like stream_options that would cause - // Anthropic to reject the request with "extra inputs are not permitted" - for (k, v) in &req.extras { - if ANTHROPIC_KNOWN_KEYS.contains(&k.as_str()) { - obj.insert(k.clone(), v.clone()); + // Add reasoning as thinking if present (use pre-computed value from temperature override) + if let Some(thinking) = thinking_val { + obj.insert("thinking".into(), thinking); + } + + // Add metadata from canonical params + // Anthropic only accepts user_id in metadata, so filter out other fields + if let Some(metadata) = req.params.metadata.as_ref() { + if let Some(obj_map) = metadata.as_object() { + if let Some(user_id) = obj_map.get("user_id") { + obj.insert("metadata".into(), serde_json::json!({ "user_id": user_id })); + } + // Skip metadata entirely if no user_id present + } + } + + // Add service_tier from canonical params + // Map OpenAI's "default" to Anthropic's "auto" (Anthropic only accepts "auto" or "standard_only") + if let Some(ref service_tier) = req.params.service_tier { + let anthropic_tier = match service_tier.as_str() { + "default" => "auto", + other => other, + }; + obj.insert( + "service_tier".into(), + Value::String(anthropic_tier.to_string()), + ); + } + + // Add output_format for structured outputs (beta feature) + if let Some(output_format_val) = req.params.response_format_for(ProviderFormat::Anthropic) { + obj.insert("output_format".into(), output_format_val); + } + + // Merge back provider-specific extras (only for Anthropic) + if let Some(extras) = req.provider_extras.get(&ProviderFormat::Anthropic) { + for (k, v) in extras { + // Don't overwrite canonical fields we already handled + if !obj.contains_key(k) { + obj.insert(k.clone(), v.clone()); + } } } @@ -197,20 +306,15 @@ impl ProviderAdapter for AnthropicAdapter { let messages = as TryFromLLM>>::try_from(content_blocks) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let finish_reason = payload - .get("stop_reason") - .and_then(Value::as_str) - .map(|s| s.parse().unwrap()); - - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u.get("cache_read_input_tokens").and_then(Value::as_i64), - prompt_cache_creation_tokens: u - .get("cache_creation_input_tokens") - .and_then(Value::as_i64), - completion_reasoning_tokens: None, // Anthropic doesn't expose thinking tokens separately - }); + let finish_reason = match payload.get("stop_reason").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "FinishReason", + value: s.to_string(), + })?), + None => None, + }; + + let usage = UniversalUsage::extract_from_response(&payload, self.format()); Ok(UniversalResponse { model: payload @@ -231,8 +335,10 @@ impl ProviderAdapter for AnthropicAdapter { let content_value = 
serde_json::to_value(&content_blocks) .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; - let stop_reason = self - .map_finish_reason(resp.finish_reason.as_ref()) + let stop_reason = resp + .finish_reason + .as_ref() + .map(|r| r.to_provider_string(self.format()).to_string()) .unwrap_or_else(|| "end_turn".to_string()); let mut obj = serde_json::json!({ @@ -245,28 +351,14 @@ impl ProviderAdapter for AnthropicAdapter { }); if let Some(usage) = &resp.usage { - obj.as_object_mut().unwrap().insert( - "usage".into(), - serde_json::json!({ - "input_tokens": usage.prompt_tokens.unwrap_or(0), - "output_tokens": usage.completion_tokens.unwrap_or(0) - }), - ); + obj.as_object_mut() + .unwrap() + .insert("usage".into(), usage.to_provider_value(self.format())); } Ok(obj) } - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option { - reason.map(|r| match r { - FinishReason::Stop => "end_turn".to_string(), - FinishReason::Length => "max_tokens".to_string(), - FinishReason::ToolCalls => "tool_use".to_string(), - FinishReason::ContentFilter => "content_filter".to_string(), - FinishReason::Other(s) => s.clone(), - }) - } - // ========================================================================= // Streaming response handling // ========================================================================= @@ -305,10 +397,13 @@ impl ProviderAdapter for AnthropicAdapter { let delta_type = delta.and_then(|d| d.get("type")).and_then(Value::as_str); if delta_type == Some("text_delta") { - let text = delta - .and_then(|d| d.get("text")) - .and_then(Value::as_str) - .unwrap_or(""); + let text = delta.and_then(|d| d.get("text")).and_then(Value::as_str); + + // Use null for empty/missing text, preserving semantic equivalence with source + let content_value = match text { + Some(t) if !t.is_empty() => Value::String(t.to_string()), + _ => Value::Null, // Empty or missing text becomes null + }; let index = payload.get("index").and_then(Value::as_u64).unwrap_or(0) as u32; @@ -319,7 +414,7 @@ impl ProviderAdapter for AnthropicAdapter { index, delta: Some(serde_json::json!({ "role": "assistant", - "content": text + "content": content_value })), finish_reason: None, }], @@ -339,22 +434,10 @@ impl ProviderAdapter for AnthropicAdapter { .and_then(|d| d.get("stop_reason")) .and_then(Value::as_str); - let finish_reason = stop_reason.map(|r| match r { - "end_turn" | "stop_sequence" => "stop".to_string(), - "max_tokens" => "length".to_string(), - "tool_use" => "tool_calls".to_string(), - other => other.to_string(), - }); - - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u.get("cache_read_input_tokens").and_then(Value::as_i64), - prompt_cache_creation_tokens: u - .get("cache_creation_input_tokens") - .and_then(Value::as_i64), - completion_reasoning_tokens: None, - }); + let finish_reason = stop_reason + .map(|r| FinishReason::from_provider_string(r, self.format()).to_string()); + + let usage = UniversalUsage::extract_from_response(&payload, self.format()); if finish_reason.is_some() || usage.is_some() { return Ok(Some(UniversalStreamChunk::new( @@ -386,17 +469,7 @@ impl ProviderAdapter for AnthropicAdapter { .map(String::from); let usage = message .and_then(|m| m.get("usage")) - .map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), 
- prompt_cached_tokens: u - .get("cache_read_input_tokens") - .and_then(Value::as_i64), - prompt_cache_creation_tokens: u - .get("cache_creation_input_tokens") - .and_then(Value::as_i64), - completion_reasoning_tokens: None, - }); + .map(|u| UniversalUsage::from_provider_value(u, self.format())); // Return chunk with metadata but mark as role initialization Ok(Some(UniversalStreamChunk::new( @@ -442,6 +515,50 @@ impl ProviderAdapter for AnthropicAdapter { .and_then(|c| c.finish_reason.as_ref()) .is_some(); + // Check if this is an initial metadata chunk (has model/id/usage but no content) + let is_initial_metadata = + (chunk.model.is_some() || chunk.id.is_some() || chunk.usage.is_some()) + && !has_finish + && chunk + .choices + .first() + .and_then(|c| c.delta.as_ref()) + .is_none_or(|d| { + // Initial chunk has role but empty/no content + d.get("content") + .and_then(Value::as_str) + .is_none_or(|s| s.is_empty()) + }); + + if is_initial_metadata { + // Return message_start with model/id/usage + let id = chunk + .id + .clone() + .unwrap_or_else(|| format!("msg_{}", PLACEHOLDER_ID)); + + let mut message = serde_json::json!({ + "id": id, + "type": "message", + "role": "assistant", + "model": chunk.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), + "content": [], + "stop_reason": null, + "stop_sequence": null + }); + + if let Some(usage) = &chunk.usage { + if let Some(obj) = message.as_object_mut() { + obj.insert("usage".into(), usage.to_provider_value(self.format())); + } + } + + return Ok(serde_json::json!({ + "type": "message_start", + "message": message + })); + } + if has_finish { // Generate message_delta with stop_reason let finish_reason = chunk.choices.first().and_then(|c| c.finish_reason.as_ref()); @@ -460,13 +577,9 @@ impl ProviderAdapter for AnthropicAdapter { }); if let Some(usage) = &chunk.usage { - obj.as_object_mut().unwrap().insert( - "usage".into(), - serde_json::json!({ - "input_tokens": usage.prompt_tokens.unwrap_or(0), - "output_tokens": usage.completion_tokens.unwrap_or(0) - }), - ); + if let Some(obj_map) = obj.as_object_mut() { + obj_map.insert("usage".into(), usage.to_provider_value(self.format())); + } } return Ok(obj); @@ -486,13 +599,21 @@ impl ProviderAdapter for AnthropicAdapter { })); } - // Role-only delta (initial chunk) - return content_block_start - if delta.get("role").is_some() && delta.get("content").is_none() { + // Role-only delta or null content - return empty text_delta + // Treat null content the same as missing content (semantically equivalent) + // Using text_delta (instead of content_block_start) ensures proper roundtrip + // since our stream_to_universal converts empty text back to null + // Note: When tool_calls are present with null content, this will emit empty text + // which is documented as an expected limitation in streaming_expected_differences.json + let content_is_missing_or_null = + delta.get("content").is_none() || delta.get("content") == Some(&Value::Null); + + if delta.get("role").is_some() && content_is_missing_or_null { return Ok(serde_json::json!({ - "type": "content_block_start", + "type": "content_block_delta", "index": choice.index, - "content_block": { - "type": "text", + "delta": { + "type": "text_delta", "text": "" } })); @@ -559,7 +680,7 @@ mod tests { model: Some("claude-3-5-sonnet-20241022".to_string()), messages: vec![], params: UniversalParams::default(), - extras: Map::new(), + provider_extras: HashMap::new(), }; assert!(req.params.max_tokens.is_none()); @@ -577,10 +698,197 @@ mod tests { max_tokens: Some(8192), 
..Default::default() }, - extras: Map::new(), + provider_extras: HashMap::new(), }; adapter.apply_defaults(&mut req); assert_eq!(req.params.max_tokens, Some(8192)); } + + #[test] + fn test_anthropic_auto_corrects_temperature_with_thinking() { + use crate::universal::message::UserContent; + use crate::universal::request::ReasoningConfig; + + let adapter = AnthropicAdapter; + + // Request with thinking enabled and user-specified temperature + let req = UniversalRequest { + model: Some("claude-sonnet-4-20250514".to_string()), + messages: vec![Message::User { + content: UserContent::String("Hello".to_string()), + }], + params: UniversalParams { + temperature: Some(0.5), // User specified, but should be overridden + reasoning: Some(ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(2048), + ..Default::default() + }), + max_tokens: Some(4096), + ..Default::default() + }, + provider_extras: HashMap::new(), + }; + + let result = adapter.request_from_universal(&req).unwrap(); + + // Temperature should be auto-corrected to 1.0 (ANTHROPIC_THINKING_TEMPERATURE) + assert_eq!( + result.get("temperature").unwrap().as_f64().unwrap(), + 1.0, + "Temperature should be auto-corrected to 1.0 when thinking is enabled" + ); + + // Thinking should be present + assert!( + result.get("thinking").is_some(), + "thinking field should be present" + ); + } + + #[test] + fn test_anthropic_preserves_temperature_without_thinking() { + use crate::universal::message::UserContent; + + let adapter = AnthropicAdapter; + + // Request without thinking - temperature should be preserved + let req = UniversalRequest { + model: Some("claude-3-5-sonnet-20241022".to_string()), + messages: vec![Message::User { + content: UserContent::String("Hello".to_string()), + }], + params: UniversalParams { + temperature: Some(0.7), + max_tokens: Some(1024), + ..Default::default() + }, + provider_extras: HashMap::new(), + }; + + let result = adapter.request_from_universal(&req).unwrap(); + + // Temperature should be preserved as user specified + assert_eq!( + result.get("temperature").unwrap().as_f64().unwrap(), + 0.7, + "Temperature should be preserved when thinking is not enabled" + ); + + // No thinking field + assert!( + result.get("thinking").is_none(), + "thinking field should not be present" + ); + } + + #[test] + fn test_anthropic_output_format_roundtrip() { + let adapter = AnthropicAdapter; + + // Anthropic request with output_format (structured outputs) + let payload = json!({ + "model": "claude-sonnet-4-5-20250929", + "max_tokens": 1024, + "messages": [{"role": "user", "content": "Extract: John is 25."}], + "output_format": { + "type": "json_schema", + "schema": { + "type": "object", + "properties": { + "name": { "type": "string" }, + "age": { "type": "number" } + }, + "required": ["name", "age"], + "additionalProperties": false + } + } + }); + + // Parse to universal + let universal = adapter.request_to_universal(payload.clone()).unwrap(); + + // Verify response_format is parsed + assert!( + universal.params.response_format.is_some(), + "response_format should be parsed from output_format" + ); + + // Convert back to Anthropic + let reconstructed = adapter.request_from_universal(&universal).unwrap(); + + // Verify output_format is preserved + assert!( + reconstructed.get("output_format").is_some(), + "output_format should be present in reconstructed request" + ); + let output_format = reconstructed.get("output_format").unwrap(); + assert_eq!(output_format.get("type").unwrap(), "json_schema"); + 
assert!(output_format.get("schema").is_some()); + } + + #[test] + fn test_anthropic_cross_provider_output_format() { + use crate::processing::adapters::ProviderAdapter; + use crate::providers::openai::adapter::OpenAIAdapter; + use crate::universal::request::ResponseFormatType; + + let openai_adapter = OpenAIAdapter; + let anthropic_adapter = AnthropicAdapter; + + // OpenAI request with response_format + let openai_payload = json!({ + "model": "gpt-4o", + "messages": [{"role": "user", "content": "Extract: John is 25."}], + "response_format": { + "type": "json_schema", + "json_schema": { + "name": "person_info", + "schema": { + "type": "object", + "properties": { + "name": { "type": "string" }, + "age": { "type": "number" } + }, + "required": ["name", "age"] + }, + "strict": true + } + } + }); + + // Parse OpenAI to universal + let universal = openai_adapter.request_to_universal(openai_payload).unwrap(); + assert!(universal.params.response_format.is_some()); + assert_eq!( + universal + .params + .response_format + .as_ref() + .unwrap() + .format_type, + Some(ResponseFormatType::JsonSchema) + ); + + // Convert to Anthropic + let mut universal_for_anthropic = universal; + universal_for_anthropic.model = Some("claude-sonnet-4-5-20250929".to_string()); + anthropic_adapter.apply_defaults(&mut universal_for_anthropic); + + let anthropic_request = anthropic_adapter + .request_from_universal(&universal_for_anthropic) + .unwrap(); + + // Verify Anthropic output_format structure + let output_format = anthropic_request.get("output_format").unwrap(); + assert_eq!(output_format.get("type").unwrap(), "json_schema"); + assert!(output_format.get("schema").is_some()); + // Name should NOT be included (Anthropic doesn't support it) + assert!(output_format.get("name").is_none()); + // strict is NOT supported in Anthropic output_format (it's for tools only) + assert!(output_format.get("strict").is_none()); + // Anthropic format doesn't have nested json_schema wrapper + assert!(output_format.get("json_schema").is_none()); + } } diff --git a/crates/lingua/src/providers/anthropic/convert.rs b/crates/lingua/src/providers/anthropic/convert.rs index f55ea7d2..cdca8528 100644 --- a/crates/lingua/src/providers/anthropic/convert.rs +++ b/crates/lingua/src/providers/anthropic/convert.rs @@ -2,7 +2,7 @@ use crate::error::ConvertError; use crate::providers::anthropic::generated; use crate::serde_json; use crate::universal::{ - convert::TryFromLLM, AssistantContent, AssistantContentPart, Message, ProviderOptions, + convert::TryFromLLM, message::ProviderOptions, AssistantContent, AssistantContentPart, Message, TextContentPart, ToolCallArguments, ToolContentPart, ToolResultContentPart, UserContent, UserContentPart, }; @@ -141,42 +141,69 @@ impl TryFromLLM for Message { continue; } generated::InputContentBlockType::Document => { - if let Some(source) = block.source { + // Map document to File with provider_options for title/context + if let Some(source) = &block.source { + let mut opts = serde_json::Map::new(); + // Store document-specific fields in provider_options + opts.insert( + "anthropic_type".into(), + serde_json::Value::String("document".to_string()), + ); + if let Some(title) = &block.title { + opts.insert( + "title".into(), + serde_json::Value::String(title.clone()), + ); + } + if let Some(context) = &block.context { + opts.insert( + "context".into(), + serde_json::Value::String(context.clone()), + ); + } + + // Extract data and media_type from source match source { - generated::Source::SourceSource(doc_source) => { 
- if let Some(data) = doc_source.data { - let media_type = doc_source - .media_type - .map(|mt| match mt { - generated::FluffyMediaType::ImageJpeg => { - "image/jpeg".to_string() - } - generated::FluffyMediaType::ImagePng => { - "image/png".to_string() - } - generated::FluffyMediaType::ImageGif => { - "image/gif".to_string() - } - generated::FluffyMediaType::ImageWebp => { - "image/webp".to_string() - } - generated::FluffyMediaType::ApplicationPdf => { - "application/pdf".to_string() - } - generated::FluffyMediaType::TextPlain => { - "text/plain".to_string() - } - }) - .unwrap_or_else(|| "text/plain".to_string()); - content_parts.push(UserContentPart::File { - data: serde_json::Value::String(data), - filename: block.title.clone(), - media_type, - provider_options: None, - }); - } + generated::Source::SourceSource(s) => { + let media_type = s.media_type.as_ref().map(|mt| { + match mt { + generated::FluffyMediaType::ImageJpeg => { + "image/jpeg".to_string() + } + generated::FluffyMediaType::ImagePng => { + "image/png".to_string() + } + generated::FluffyMediaType::ImageGif => { + "image/gif".to_string() + } + generated::FluffyMediaType::ImageWebp => { + "image/webp".to_string() + } + generated::FluffyMediaType::ApplicationPdf => { + "application/pdf".to_string() + } + generated::FluffyMediaType::TextPlain => { + "text/plain".to_string() + } + } + }); + content_parts.push(UserContentPart::File { + data: s + .data + .clone() + .map(serde_json::Value::String) + .unwrap_or(serde_json::Value::Null), + filename: None, + media_type: media_type.unwrap_or_else(|| { + "text/plain".to_string() + }), + provider_options: Some(ProviderOptions { + options: opts, + }), + }); } _ => { + // Skip other source types continue; } } @@ -191,16 +218,7 @@ impl TryFromLLM for Message { if content_parts.is_empty() { UserContent::String(String::new()) - } else if content_parts.len() == 1 { - // Single text part can be simplified to string, but keep arrays for multimodal - match &content_parts[0] { - UserContentPart::Text(text_part) => { - UserContent::String(text_part.text.clone()) - } - _ => UserContent::Array(content_parts), - } } else { - // Multiple parts or multimodal content must remain as array UserContent::Array(content_parts) } } @@ -210,12 +228,7 @@ impl TryFromLLM for Message { } generated::MessageRole::Assistant => { let content = match input_msg.content { - generated::MessageContent::String(text) => { - AssistantContent::Array(vec![AssistantContentPart::Text(TextContentPart { - text, - provider_options: None, - })]) - } + generated::MessageContent::String(text) => AssistantContent::String(text), generated::MessageContent::InputContentBlockArray(blocks) => { let mut content_parts = Vec::new(); @@ -223,19 +236,16 @@ impl TryFromLLM for Message { match block.input_content_block_type { generated::InputContentBlockType::Text => { if let Some(text) = block.text { + // Preserve citations in provider_options for roundtrip let provider_options = block.citations.as_ref().map(|citations| { let mut opts = serde_json::Map::new(); - if let Ok(citations_json) = - serde_json::to_value(citations) - { - opts.insert( - "citations".to_string(), - citations_json, - ); + if let Ok(v) = serde_json::to_value(citations) { + opts.insert("citations".into(), v); } ProviderOptions { options: opts } }); + content_parts.push(AssistantContentPart::Text( TextContentPart { text, @@ -248,6 +258,7 @@ impl TryFromLLM for Message { if let Some(thinking) = block.thinking { content_parts.push(AssistantContentPart::Reasoning { text: thinking, + // 
Preserve the signature in encrypted_content for roundtrip encrypted_content: block.signature.clone(), }); } @@ -275,7 +286,7 @@ impl TryFromLLM for Message { } } generated::InputContentBlockType::ServerToolUse => { - // Server-executed tool call (e.g., web_search) + // Server-executed tool use (web search, etc.) if let (Some(id), Some(name)) = (&block.id, &block.name) { let input = if let Some(input_map) = &block.input { serde_json::to_value(input_map) @@ -291,24 +302,30 @@ impl TryFromLLM for Message { .unwrap_or_else(|_| "{}".to_string()) .into(), provider_options: None, - provider_executed: Some(true), + provider_executed: Some(true), // Mark as server-executed }); } } generated::InputContentBlockType::WebSearchToolResult => { - // Web search tool result - if let Some(tool_use_id) = &block.tool_use_id { - let output = if let Some(content) = &block.content { - serde_json::to_value(content) - .unwrap_or(serde_json::Value::Null) - } else { - serde_json::Value::Null - }; + // Web search tool result - convert to ToolResult with marker + if let Some(id) = &block.tool_use_id { + let mut output = serde_json::Map::new(); + output.insert( + "anthropic_type".into(), + serde_json::Value::String( + "web_search_tool_result".to_string(), + ), + ); + if let Some(content) = &block.content { + if let Ok(v) = serde_json::to_value(content) { + output.insert("content".into(), v); + } + } content_parts.push(AssistantContentPart::ToolResult { - tool_call_id: tool_use_id.clone(), - tool_name: "web_search".to_string(), - output, + tool_call_id: id.clone(), + tool_name: "web_search".to_string(), // Server-executed web search tool + output: serde_json::Value::Object(output), provider_options: None, }); } @@ -385,28 +402,48 @@ impl TryFromLLM for generated::InputMessage { }; if let Some(image_data) = data { - let anthropic_media_type = - media_type.as_ref().and_then(|mt| match mt.as_str() { - "image/jpeg" => { - Some(generated::FluffyMediaType::ImageJpeg) - } - "image/png" => { - Some(generated::FluffyMediaType::ImagePng) - } - "image/gif" => { - Some(generated::FluffyMediaType::ImageGif) - } - "image/webp" => { - Some(generated::FluffyMediaType::ImageWebp) - } - "application/pdf" => { - Some(generated::FluffyMediaType::ApplicationPdf) - } - "text/plain" => { - Some(generated::FluffyMediaType::TextPlain) - } - _ => None, - }); + // Check if this is a URL - use URL source type (no media_type required) + let is_url = image_data.starts_with("http://") + || image_data.starts_with("https://"); + + let (source_type, source_url, source_data, anthropic_media_type) = if is_url { + ( + generated::FluffyType::Url, + Some(image_data), + None, + None, + ) + } else { + // Base64 data - parse media_type + let anthropic_media_type = + media_type.as_ref().and_then(|mt| match mt.as_str() { + "image/jpeg" => { + Some(generated::FluffyMediaType::ImageJpeg) + } + "image/png" => { + Some(generated::FluffyMediaType::ImagePng) + } + "image/gif" => { + Some(generated::FluffyMediaType::ImageGif) + } + "image/webp" => { + Some(generated::FluffyMediaType::ImageWebp) + } + "application/pdf" => { + Some(generated::FluffyMediaType::ApplicationPdf) + } + "text/plain" => { + Some(generated::FluffyMediaType::TextPlain) + } + _ => None, + }); + ( + generated::FluffyType::Base64, + None, + Some(image_data), + anthropic_media_type, + ) + }; Some(generated::InputContentBlock { cache_control: None, @@ -416,10 +453,10 @@ impl TryFromLLM for generated::InputMessage { generated::InputContentBlockType::Image, source: Some(generated::Source::SourceSource( 
generated::SourceSource { - data: Some(image_data), + data: source_data, media_type: anthropic_media_type, - source_type: generated::FluffyType::Base64, - url: None, + source_type, + url: source_url, content: None, }, )), @@ -441,36 +478,45 @@ impl TryFromLLM for generated::InputMessage { } UserContentPart::File { data, - filename, media_type, + provider_options, .. } => { - // Convert universal file back to Anthropic Document format - let file_data = match data { - serde_json::Value::String(s) => Some(s), - _ => None, - }; + // Check if this was originally a Document block + let is_document = provider_options + .as_ref() + .and_then(|opts| opts.options.get("anthropic_type")) + .and_then(|v| v.as_str()) + == Some("document"); + + if is_document { + // Restore as Document block + let title = provider_options + .as_ref() + .and_then(|opts| opts.options.get("title")) + .and_then(|v| v.as_str()) + .map(|s| s.to_string()); + + let context = provider_options + .as_ref() + .and_then(|opts| opts.options.get("context")) + .and_then(|v| v.as_str()) + .map(|s| s.to_string()); - if let Some(doc_data) = file_data { let anthropic_media_type = match media_type.as_str() { - "image/jpeg" => { - Some(generated::FluffyMediaType::ImageJpeg) - } - "image/png" => { - Some(generated::FluffyMediaType::ImagePng) - } - "image/gif" => { - Some(generated::FluffyMediaType::ImageGif) - } - "image/webp" => { - Some(generated::FluffyMediaType::ImageWebp) - } + "image/jpeg" => Some(generated::FluffyMediaType::ImageJpeg), + "image/png" => Some(generated::FluffyMediaType::ImagePng), + "image/gif" => Some(generated::FluffyMediaType::ImageGif), + "image/webp" => Some(generated::FluffyMediaType::ImageWebp), "application/pdf" => { Some(generated::FluffyMediaType::ApplicationPdf) } - "text/plain" => { - Some(generated::FluffyMediaType::TextPlain) - } + "text/plain" => Some(generated::FluffyMediaType::TextPlain), + _ => Some(generated::FluffyMediaType::TextPlain), + }; + + let data_str = match data { + serde_json::Value::String(s) => Some(s), _ => None, }; @@ -482,15 +528,15 @@ impl TryFromLLM for generated::InputMessage { generated::InputContentBlockType::Document, source: Some(generated::Source::SourceSource( generated::SourceSource { - data: Some(doc_data), + data: data_str, media_type: anthropic_media_type, source_type: generated::FluffyType::Text, url: None, content: None, }, )), - context: None, - title: filename, + context, + title, content: None, signature: None, thinking: None, @@ -502,6 +548,7 @@ impl TryFromLLM for generated::InputMessage { tool_use_id: None, }) } else { + // Regular file - skip for now None } } @@ -517,39 +564,19 @@ impl TryFromLLM for generated::InputMessage { }) } Message::Assistant { content, .. 
} => { - let blocks = match content { - AssistantContent::String(text) => { - vec![generated::InputContentBlock { - cache_control: None, - citations: None, - text: Some(text), - input_content_block_type: generated::InputContentBlockType::Text, - source: None, - context: None, - title: None, - content: None, - signature: None, - thinking: None, - data: None, - id: None, - input: None, - name: None, - is_error: None, - tool_use_id: None, - }] - } - AssistantContent::Array(parts) => parts - .into_iter() - .filter_map(|part| match part { + let content = match content { + AssistantContent::String(text) => generated::MessageContent::String(text), + AssistantContent::Array(parts) => { + let blocks = parts + .into_iter() + .filter_map(|part| match part { AssistantContentPart::Text(text_part) => { - let citations = text_part - .provider_options + // Restore citations from provider_options + let citations = text_part.provider_options .as_ref() .and_then(|opts| opts.options.get("citations")) - .and_then(|v| { - serde_json::from_value::(v.clone()) - .ok() - }); + .and_then(|v| serde_json::from_value::(v.clone()).ok()); + Some(generated::InputContentBlock { cache_control: None, citations, @@ -573,25 +600,28 @@ impl TryFromLLM for generated::InputMessage { AssistantContentPart::Reasoning { text, encrypted_content, - } => Some(generated::InputContentBlock { - cache_control: None, - citations: None, - text: None, - input_content_block_type: - generated::InputContentBlockType::Thinking, - source: None, - context: None, - title: None, - content: None, - signature: encrypted_content, - thinking: Some(text), - data: None, - id: None, - input: None, - name: None, - is_error: None, - tool_use_id: None, - }), + } => { + Some(generated::InputContentBlock { + cache_control: None, + citations: None, + text: None, + input_content_block_type: + generated::InputContentBlockType::Thinking, + source: None, + context: None, + title: None, + content: None, + // Restore signature from encrypted_content + signature: encrypted_content, + thinking: Some(text), + data: None, + id: None, + input: None, + name: None, + is_error: None, + tool_use_id: None, + }) + } AssistantContentPart::ToolCall { tool_call_id, tool_name, @@ -605,7 +635,7 @@ impl TryFromLLM for generated::InputMessage { ToolCallArguments::Invalid(_) => None, }; - // Use ServerToolUse for provider-executed tools, ToolUse otherwise + // Use ServerToolUse for provider-executed tools let block_type = if provider_executed == Some(true) { generated::InputContentBlockType::ServerToolUse } else { @@ -636,36 +666,50 @@ impl TryFromLLM for generated::InputMessage { output, .. 
} => { - // Convert tool result back to WebSearchToolResult - let content = serde_json::from_value(output).ok(); + // Check if this was a web_search_tool_result + let is_web_search_result = output.as_object() + .and_then(|obj| obj.get("anthropic_type")) + .and_then(|v| v.as_str()) + == Some("web_search_tool_result"); - Some(generated::InputContentBlock { - cache_control: None, - citations: None, - text: None, - input_content_block_type: - generated::InputContentBlockType::WebSearchToolResult, - source: None, - context: None, - title: None, - content, - signature: None, - thinking: None, - data: None, - id: None, - input: None, - name: None, - is_error: None, - tool_use_id: Some(tool_call_id), - }) + if is_web_search_result { + // Restore WebSearchToolResult block + let content = output.as_object() + .and_then(|obj| obj.get("content")) + .and_then(|v| serde_json::from_value::(v.clone()).ok()); + + Some(generated::InputContentBlock { + cache_control: None, + citations: None, + text: None, + input_content_block_type: + generated::InputContentBlockType::WebSearchToolResult, + source: None, + context: None, + title: None, + content, + signature: None, + thinking: None, + data: None, + id: None, + input: None, + name: None, + is_error: None, + tool_use_id: Some(tool_call_id.clone()), + }) + } else { + None // Skip other tool results in assistant messages + } } _ => None, // Skip other types for now }) - .collect(), + .collect(); + generated::MessageContent::InputContentBlockArray(blocks) + } }; Ok(generated::InputMessage { - content: generated::MessageContent::InputContentBlockArray(blocks), + content, role: generated::MessageRole::Assistant, }) } @@ -737,8 +781,8 @@ impl TryFromLLM> for Vec { // Preserve citations in provider_options for roundtrip let provider_options = block.citations.as_ref().map(|citations| { let mut opts = serde_json::Map::new(); - if let Ok(citations_json) = serde_json::to_value(citations) { - opts.insert("citations".to_string(), citations_json); + if let Ok(v) = serde_json::to_value(citations) { + opts.insert("citations".into(), v); } ProviderOptions { options: opts } }); @@ -752,6 +796,7 @@ impl TryFromLLM> for Vec { if let Some(thinking) = block.thinking { content_parts.push(AssistantContentPart::Reasoning { text: thinking, + // Preserve signature in encrypted_content for roundtrip encrypted_content: block.signature.clone(), }); } @@ -777,7 +822,7 @@ impl TryFromLLM> for Vec { } } generated::ContentBlockType::ServerToolUse => { - // Server-executed tool call (e.g., web_search) + // Server-executed tool (similar to ToolUse but provider_executed=true) if let (Some(id), Some(name)) = (block.id, block.name) { let input = if let Some(input_map) = block.input { serde_json::to_value(input_map).unwrap_or(serde_json::Value::Null) @@ -792,29 +837,35 @@ impl TryFromLLM> for Vec { .unwrap_or_else(|_| "{}".to_string()) .into(), provider_options: None, - provider_executed: Some(true), + provider_executed: Some(true), // Mark as server-executed }); } } generated::ContentBlockType::WebSearchToolResult => { - // Web search tool result with encrypted content - if let Some(tool_use_id) = block.tool_use_id { - let output = if let Some(content) = block.content { - serde_json::to_value(content).unwrap_or(serde_json::Value::Null) - } else { - serde_json::Value::Null - }; + // Web search tool result - convert to ToolResult with full data + if let Some(id) = block.tool_use_id { + // Store the entire block data for roundtrip + let mut output = serde_json::Map::new(); + output.insert( + 
"anthropic_type".into(), + serde_json::Value::String("web_search_tool_result".to_string()), + ); + if let Some(content) = &block.content { + if let Ok(v) = serde_json::to_value(content) { + output.insert("content".into(), v); + } + } content_parts.push(AssistantContentPart::ToolResult { - tool_call_id: tool_use_id, + tool_call_id: id, tool_name: "web_search".to_string(), - output, + output: serde_json::Value::Object(output), provider_options: None, }); } } _ => { - // Skip other types for now + // Skip other types (RedactedThinking, etc.) continue; } } @@ -896,6 +947,7 @@ impl TryFromLLM> for Vec { citations: None, text: None, content_block_type: generated::ContentBlockType::Thinking, + // Restore signature from encrypted_content signature: encrypted_content, thinking: Some(text), data: None, @@ -919,7 +971,7 @@ impl TryFromLLM> for Vec { ToolCallArguments::Invalid(_) => None, }; - // Use ServerToolUse for provider-executed tools, ToolUse otherwise + // Use ServerToolUse if provider_executed is true let block_type = if provider_executed == Some(true) { generated::ContentBlockType::ServerToolUse } else { @@ -945,23 +997,38 @@ impl TryFromLLM> for Vec { output, .. } => { - // Convert tool result back to WebSearchToolResult - let content = serde_json::from_value(output).ok(); + // Check if this is a web_search_tool_result + let is_web_search_result = + output.get("anthropic_type").and_then(|v| v.as_str()) + == Some("web_search_tool_result"); - content_blocks.push(generated::ContentBlock { - citations: None, - text: None, - content_block_type: - generated::ContentBlockType::WebSearchToolResult, - signature: None, - thinking: None, - data: None, - id: None, - input: None, - name: None, - content, - tool_use_id: Some(tool_call_id), - }); + if is_web_search_result { + // Restore as WebSearchToolResult + let content = output.get("content").and_then(|v| { + serde_json::from_value::< + generated::ContentBlockContent, + >( + v.clone() + ) + .ok() + }); + + content_blocks.push(generated::ContentBlock { + citations: None, + text: None, + content_block_type: + generated::ContentBlockType::WebSearchToolResult, + signature: None, + thinking: None, + data: None, + id: None, + input: None, + name: None, + content, + tool_use_id: Some(tool_call_id.clone()), + }); + } + // Skip other tool results - they shouldn't appear in response content } _ => { // Skip other types for now @@ -978,22 +1045,6 @@ impl TryFromLLM> for Vec { } } - if content_blocks.is_empty() { - content_blocks.push(generated::ContentBlock { - citations: None, - text: Some(String::new()), - content_block_type: generated::ContentBlockType::Text, - signature: None, - thinking: None, - data: None, - id: None, - input: None, - name: None, - content: None, - tool_use_id: None, - }); - } - Ok(content_blocks) } } diff --git a/crates/lingua/src/providers/anthropic/generated.rs b/crates/lingua/src/providers/anthropic/generated.rs index 77d46db1..0d8a51a8 100644 --- a/crates/lingua/src/providers/anthropic/generated.rs +++ b/crates/lingua/src/providers/anthropic/generated.rs @@ -283,6 +283,7 @@ pub struct InputContentBlock { pub cache_control: Option, #[serde(skip_serializing_if = "Option::is_none")] pub citations: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub text: Option, #[serde(rename = "type")] pub input_content_block_type: InputContentBlockType, @@ -323,6 +324,7 @@ pub struct CacheControlEphemeral { /// - `1h`: 1 hour /// /// Defaults to `5m`. 
+ #[serde(skip_serializing_if = "Option::is_none")] pub ttl: Option, #[serde(rename = "type")] pub cache_control_ephemeral_type: CacheControlEphemeralType, @@ -369,6 +371,7 @@ pub struct RequestLocationCitation { pub document_title: Option, #[serde(skip_serializing_if = "Option::is_none")] pub end_char_index: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub start_char_index: Option, #[serde(rename = "type")] pub request_location_citation_type: CitationType, @@ -440,6 +443,7 @@ pub struct Block { pub cache_control: Option, #[serde(skip_serializing_if = "Option::is_none")] pub citations: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub text: Option, #[serde(rename = "type")] pub block_type: WebSearchToolResultBlockItemType, @@ -506,6 +510,7 @@ pub enum Source { pub struct SourceSource { #[serde(skip_serializing_if = "Option::is_none")] pub data: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub media_type: Option, #[serde(rename = "type")] pub source_type: FluffyType, @@ -534,6 +539,7 @@ pub struct ContentBlockSourceContentItem { pub cache_control: Option, #[serde(skip_serializing_if = "Option::is_none")] pub citations: Option>, + #[serde(skip_serializing_if = "Option::is_none")] pub text: Option, #[serde(rename = "type")] pub content_block_source_content_item_type: ContentBlockSourceContentItemType, @@ -554,6 +560,7 @@ pub enum ContentBlockSourceContentItemType { pub struct SourceSourceClass { #[serde(skip_serializing_if = "Option::is_none")] pub data: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub media_type: Option, #[serde(rename = "type")] pub source_type: PurpleType, @@ -731,6 +738,7 @@ pub struct Thinking { /// See [extended /// thinking](https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking) for /// details. + #[serde(skip_serializing_if = "Option::is_none")] pub budget_tokens: Option, #[serde(rename = "type")] pub thinking_type: ThinkingType, @@ -764,6 +772,7 @@ pub struct ToolChoice { /// Whether to disable parallel tool use. /// /// Defaults to `false`. If set to `true`, the model will output exactly one tool use. + #[serde(skip_serializing_if = "Option::is_none")] pub disable_parallel_tool_use: Option, #[serde(rename = "type")] pub tool_choice_type: ToolChoiceType, @@ -919,6 +928,7 @@ pub struct InputSchema { #[ts(type = "unknown")] #[serde(skip_serializing_if = "Option::is_none")] pub properties: Option>, + #[serde(skip_serializing_if = "Option::is_none")] pub required: Option>, #[serde(rename = "type")] pub input_schema_type: InputSchemaType, @@ -962,6 +972,7 @@ pub struct UserLocation { #[serde(skip_serializing_if = "Option::is_none")] pub region: Option, /// The [IANA timezone](https://nodatime.org/TimeZones) of the user. + #[serde(skip_serializing_if = "Option::is_none")] pub timezone: Option, #[serde(rename = "type")] pub user_location_type: UserLocationType, @@ -1070,6 +1081,7 @@ pub struct ContentBlock { /// document results in `content_block_location`. 
#[serde(skip_serializing_if = "Option::is_none")] pub citations: Option>, + #[serde(skip_serializing_if = "Option::is_none")] pub text: Option, #[serde(rename = "type")] pub content_block_type: ContentBlockType, @@ -1104,6 +1116,7 @@ pub struct ResponseLocationCitation { pub end_char_index: Option, #[serde(skip_serializing_if = "Option::is_none")] pub file_id: Option, + #[serde(skip_serializing_if = "Option::is_none")] pub start_char_index: Option, #[serde(rename = "type")] pub response_location_citation_type: CitationType, diff --git a/crates/lingua/src/providers/anthropic/mod.rs b/crates/lingua/src/providers/anthropic/mod.rs index df2fe6b1..b33bb334 100644 --- a/crates/lingua/src/providers/anthropic/mod.rs +++ b/crates/lingua/src/providers/anthropic/mod.rs @@ -9,6 +9,7 @@ pub mod adapter; pub mod convert; pub mod detect; pub mod generated; +pub mod params; #[cfg(test)] pub mod test_anthropic; diff --git a/crates/lingua/src/providers/anthropic/params.rs b/crates/lingua/src/providers/anthropic/params.rs new file mode 100644 index 00000000..2a5eea31 --- /dev/null +++ b/crates/lingua/src/providers/anthropic/params.rs @@ -0,0 +1,157 @@ +/*! +Typed parameter structs for Anthropic Messages API. + +These structs use `#[serde(flatten)]` to automatically capture unknown fields, +eliminating the need for explicit KNOWN_KEYS arrays. +*/ + +use crate::providers::anthropic::generated::{InputMessage, Thinking}; +use crate::serde_json::Value; +use serde::{Deserialize, Serialize}; +use std::collections::BTreeMap; + +/// Anthropic Messages API request parameters. +/// +/// All known fields are explicitly typed. Unknown fields automatically +/// go into `extras` via `#[serde(flatten)]`. +#[derive(Debug, Clone, Default, Serialize, Deserialize)] +pub struct AnthropicParams { + // === Core fields === + pub model: Option, + pub messages: Option>, + + // === System prompt (can be string or array with cache_control) === + pub system: Option, + + // === Required output control === + pub max_tokens: Option, + + // === Sampling parameters === + pub temperature: Option, + pub top_p: Option, + pub top_k: Option, + pub stop_sequences: Option, + + // === Streaming === + pub stream: Option, + + // === Tools and function calling === + pub tools: Option, + pub tool_choice: Option, + + // === Extended thinking === + pub thinking: Option, + + // === Structured outputs (beta: structured-outputs-2025-11-13) === + /// Output format for structured JSON responses. + /// Structure: `{ type: "json_schema", schema: {...} }` + pub output_format: Option, + + // === Metadata and identification === + pub metadata: Option, + pub service_tier: Option, + + /// Unknown fields - automatically captured by serde flatten. + /// These are provider-specific fields not in the canonical set. 
+ #[serde(flatten)] + pub extras: BTreeMap, +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json; + use crate::serde_json::json; + + #[test] + fn test_anthropic_params_known_fields() { + let json = json!({ + "model": "claude-sonnet-4-20250514", + "messages": [{"role": "user", "content": "Hello"}], + "max_tokens": 1024, + "temperature": 0.7, + "top_k": 40 + }); + + let params: AnthropicParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.model, Some("claude-sonnet-4-20250514".to_string())); + assert_eq!(params.max_tokens, Some(1024)); + assert_eq!(params.temperature, Some(0.7)); + assert_eq!(params.top_k, Some(40)); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_anthropic_params_with_thinking() { + use crate::providers::anthropic::generated::ThinkingType; + + let json = json!({ + "model": "claude-sonnet-4-20250514", + "messages": [], + "max_tokens": 16000, + "thinking": { + "type": "enabled", + "budget_tokens": 10000 + } + }); + + let params: AnthropicParams = serde_json::from_value(json).unwrap(); + assert!(params.thinking.is_some()); + let thinking = params.thinking.unwrap(); + assert_eq!(thinking.thinking_type, ThinkingType::Enabled); + assert_eq!(thinking.budget_tokens, Some(10000)); + } + + #[test] + fn test_anthropic_params_with_system_cache_control() { + let json = json!({ + "model": "claude-sonnet-4-20250514", + "messages": [], + "max_tokens": 1024, + "system": [ + { + "type": "text", + "text": "Be helpful.", + "cache_control": {"type": "ephemeral", "ttl": "5m"} + } + ] + }); + + let params: AnthropicParams = serde_json::from_value(json).unwrap(); + assert!(params.system.is_some()); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_anthropic_params_unknown_fields_go_to_extras() { + let json = json!({ + "model": "claude-sonnet-4-20250514", + "messages": [], + "max_tokens": 1024, + "some_future_param": "value" + }); + + let params: AnthropicParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.extras.len(), 1); + assert_eq!( + params.extras.get("some_future_param"), + Some(&Value::String("value".to_string())) + ); + } + + #[test] + fn test_anthropic_roundtrip_preserves_extras() { + let json = json!({ + "model": "claude-sonnet-4-20250514", + "messages": [], + "max_tokens": 1024, + "custom_field": {"nested": "data"} + }); + + let params: AnthropicParams = serde_json::from_value(json.clone()).unwrap(); + let back: Value = serde_json::to_value(¶ms).unwrap(); + + // Custom field should be preserved + assert_eq!(back.get("custom_field"), json.get("custom_field")); + } +} diff --git a/crates/lingua/src/providers/bedrock/adapter.rs b/crates/lingua/src/providers/bedrock/adapter.rs index c840e5a3..987e8609 100644 --- a/crates/lingua/src/providers/bedrock/adapter.rs +++ b/crates/lingua/src/providers/bedrock/adapter.rs @@ -9,33 +9,24 @@ Bedrock's Converse API has some unique characteristics: */ use crate::capabilities::ProviderFormat; -use crate::processing::adapters::{collect_extras, ProviderAdapter}; +use crate::error::ConvertError; +use crate::processing::adapters::ProviderAdapter; use crate::processing::transform::TransformError; -use crate::providers::bedrock::request::{ - BedrockInferenceConfiguration, BedrockMessage, ConverseRequest, -}; +use crate::providers::anthropic::generated::Thinking; +use crate::providers::bedrock::params::BedrockParams; +use crate::providers::bedrock::request::{BedrockInferenceConfiguration, BedrockMessage}; use crate::providers::bedrock::try_parse_bedrock; use crate::serde_json::{self, 
Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::Message; +use crate::universal::reasoning::ANTHROPIC_THINKING_TEMPERATURE; +use crate::universal::request::ReasoningConfig; +use crate::universal::tools::{UniversalTool, UniversalToolType}; use crate::universal::{ FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, }; - -/// Known request fields for Bedrock Converse API. -/// Fields not in this list go into `extras`. -const BEDROCK_KNOWN_KEYS: &[&str] = &[ - "modelId", - "messages", - "system", - "inferenceConfig", - "toolConfig", - "guardrailConfig", - "additionalModelRequestFields", - "additionalModelResponseFieldPaths", - "promptVariables", -]; +use std::collections::HashMap; /// Adapter for Amazon Bedrock Converse API. pub struct BedrockAdapter; @@ -58,30 +49,40 @@ impl ProviderAdapter for BedrockAdapter { } fn request_to_universal(&self, payload: Value) -> Result { - let extras = collect_extras(&payload, BEDROCK_KNOWN_KEYS); - - let request: ConverseRequest = serde_json::from_value(payload) + // Single parse: typed params now includes typed messages and inference_config + let typed_params: BedrockParams = serde_json::from_value(payload) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; + // Extract typed messages (partial move - other fields remain accessible) + let bedrock_messages = typed_params.messages.ok_or_else(|| { + TransformError::ToUniversalFailed("Bedrock: missing 'messages' field".to_string()) + })?; + let messages = - as TryFromLLM>>::try_from(request.messages) + as TryFromLLM>>::try_from(bedrock_messages) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - // Extract params from inferenceConfig - let (temperature, top_p, max_tokens, stop) = if let Some(config) = &request.inference_config - { - ( - config.temperature, - config.top_p, - config.max_tokens.map(|t| t as i64), - config - .stop_sequences - .as_ref() - .and_then(|s| serde_json::to_value(s).ok()), - ) - } else { - (None, None, None, None) - }; + // Extract params from inferenceConfig (now typed in params struct) + let (temperature, top_p, max_tokens, stop) = + if let Some(config) = &typed_params.inference_config { + ( + config.temperature, + config.top_p, + config.max_tokens.map(|t| t as i64), + config.stop_sequences.clone(), + ) + } else { + (None, None, None, None) + }; + + // Extract reasoning from additionalModelRequestFields.thinking + // Bedrock uses the same format as Anthropic for Claude extended thinking + let reasoning = typed_params + .additional_model_request_fields + .as_ref() + .and_then(|fields| fields.get("thinking")) + .and_then(|v| serde_json::from_value::(v.clone()).ok()) + .map(|t| ReasoningConfig::from(&t)); let params = UniversalParams { temperature, @@ -89,22 +90,73 @@ impl ProviderAdapter for BedrockAdapter { top_k: None, // Bedrock doesn't expose top_k in Converse API max_tokens, stop, - tools: request - .tool_config - .and_then(|t| serde_json::to_value(t).ok()), + tools: typed_params.tool_config.and_then(|t| { + // Bedrock uses {tools: [{toolSpec: {name, description, inputSchema: {json: {...}}}}]} + // Parse into UniversalTools + let value = serde_json::to_value(&t).ok()?; + let tools_arr = value.get("tools").and_then(|v| v.as_array())?; + + let mut universal_tools = Vec::new(); + for tool in tools_arr { + if let Some(spec) = tool.get("toolSpec") { + let name = spec.get("name").and_then(|v| v.as_str())?; + let description = spec + 
.get("description") + .and_then(|v| v.as_str()) + .map(String::from); + let parameters = + spec.get("inputSchema").and_then(|s| s.get("json")).cloned(); + + universal_tools.push(UniversalTool::function( + name, + description, + parameters, + )); + } + } + + if universal_tools.is_empty() { + // Fallback: store as builtin for unknown format (e.g., toolChoice) + Some(vec![UniversalTool::builtin( + "bedrock_tool_config", + "bedrock", + "tool_config", + Some(value), + )]) + } else { + Some(universal_tools) + } + }), tool_choice: None, // Tool choice is inside tool_config response_format: None, seed: None, // Bedrock doesn't support seed presence_penalty: None, frequency_penalty: None, stream: None, // Bedrock uses separate endpoint for streaming + // New canonical fields + parallel_tool_calls: None, + reasoning, // Extracted from additionalModelRequestFields.thinking + metadata: None, + store: None, + service_tier: None, + logprobs: None, + top_logprobs: None, }; + // Use extras captured automatically via #[serde(flatten)] + let mut provider_extras = HashMap::new(); + if !typed_params.extras.is_empty() { + provider_extras.insert( + ProviderFormat::Converse, + typed_params.extras.into_iter().collect(), + ); + } + Ok(UniversalRequest { - model: Some(request.model_id), + model: typed_params.model_id, messages, params, - extras, + provider_extras, }) } @@ -127,30 +179,28 @@ impl ProviderAdapter for BedrockAdapter { .map_err(|e| TransformError::SerializationFailed(e.to_string()))?, ); + // Check if reasoning/thinking is enabled (for temperature override) + let thinking_config = req.params.reasoning_for(ProviderFormat::Converse); + // Build inferenceConfig if any params are set - let has_params = req.params.temperature.is_some() + // Note: Claude on Bedrock requires temperature=1.0 when extended thinking is enabled + let temperature = if thinking_config.is_some() { + Some(ANTHROPIC_THINKING_TEMPERATURE) + } else { + req.params.temperature + }; + + let has_params = temperature.is_some() || req.params.top_p.is_some() || req.params.max_tokens.is_some() || req.params.stop.is_some(); if has_params { let config = BedrockInferenceConfiguration { - temperature: req.params.temperature, + temperature, top_p: req.params.top_p, max_tokens: req.params.max_tokens.map(|t| t as i32), - stop_sequences: req.params.stop.as_ref().and_then(|v| { - if let Value::Array(arr) = v { - Some( - arr.iter() - .filter_map(|s| s.as_str().map(String::from)) - .collect(), - ) - } else if let Value::String(s) = v { - Some(vec![s.clone()]) - } else { - None - } - }), + stop_sequences: req.params.stop.clone(), }; obj.insert( @@ -161,20 +211,78 @@ impl ProviderAdapter for BedrockAdapter { } // Add toolConfig if tools are present + // Bedrock uses toolConfig.tools format: [{toolSpec: {name, description, inputSchema}}] if let Some(tools) = &req.params.tools { - obj.insert("toolConfig".into(), tools.clone()); + // First check for Bedrock builtins (pass through original config) + let mut bedrock_builtin_found = false; + for tool in tools { + if let UniversalToolType::Builtin { + provider, config, .. 
+ } = &tool.tool_type + { + if provider == "bedrock" { + if let Some(config_value) = config { + obj.insert("toolConfig".into(), config_value.clone()); + bedrock_builtin_found = true; + break; + } + } + } + } + + // If no Bedrock builtin, convert function tools to Bedrock format + if !bedrock_builtin_found { + let tool_specs: Vec = tools + .iter() + .filter_map(|tool| { + if tool.is_function() { + Some(serde_json::json!({ + "toolSpec": { + "name": tool.name, + "description": tool.description, + "inputSchema": { + "json": tool.parameters.clone().unwrap_or(serde_json::json!({})) + } + } + })) + } else { + None + } + }) + .collect(); + + if !tool_specs.is_empty() { + obj.insert( + "toolConfig".into(), + serde_json::json!({"tools": tool_specs}), + ); + } + } } - // Merge extras - for (k, v) in &req.extras { - obj.insert(k.clone(), v.clone()); + // Inject reasoning/thinking into additionalModelRequestFields + // Bedrock uses additionalModelRequestFields.thinking with same format as Anthropic + if let Some(thinking_val) = &thinking_config { + let additional_fields = obj + .entry("additionalModelRequestFields") + .or_insert_with(|| Value::Object(Map::new())); + + if let Value::Object(fields) = additional_fields { + fields.insert("thinking".into(), thinking_val.clone()); + } } - Ok(Value::Object(obj)) - } + // Merge back provider-specific extras (only for Bedrock/Converse) + if let Some(extras) = req.provider_extras.get(&ProviderFormat::Converse) { + for (k, v) in extras { + // Don't overwrite canonical fields we already handled + if !obj.contains_key(k) { + obj.insert(k.clone(), v.clone()); + } + } + } - fn apply_defaults(&self, _req: &mut UniversalRequest) { - // Bedrock doesn't require any specific defaults + Ok(Value::Object(obj)) } fn detect_response(&self, payload: &Value) -> bool { @@ -201,18 +309,15 @@ impl ProviderAdapter for BedrockAdapter { as TryFromLLM>>::try_from(vec![bedrock_message]) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let finish_reason = payload - .get("stopReason") - .and_then(Value::as_str) - .map(|s| s.parse().unwrap()); - - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("inputTokens").and_then(Value::as_i64), - completion_tokens: u.get("outputTokens").and_then(Value::as_i64), - prompt_cached_tokens: u.get("cacheReadInputTokens").and_then(Value::as_i64), - prompt_cache_creation_tokens: u.get("cacheWriteInputTokens").and_then(Value::as_i64), - completion_reasoning_tokens: None, // Bedrock doesn't expose thinking tokens separately - }); + let finish_reason = match payload.get("stopReason").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "FinishReason", + value: s.to_string(), + })?), + None => None, + }; + + let usage = UniversalUsage::extract_from_response(&payload, self.format()); Ok(UniversalResponse { model: None, // Bedrock doesn't include model in response @@ -236,8 +341,10 @@ impl ProviderAdapter for BedrockAdapter { let message_value = serde_json::to_value(message) .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; - let stop_reason = self - .map_finish_reason(resp.finish_reason.as_ref()) + let stop_reason = resp + .finish_reason + .as_ref() + .map(|r| r.to_provider_string(self.format()).to_string()) .unwrap_or_else(|| "end_turn".to_string()); let mut obj = serde_json::json!({ @@ -248,28 +355,14 @@ impl ProviderAdapter for BedrockAdapter { }); if let Some(usage) = &resp.usage { - obj.as_object_mut().unwrap().insert( - 
"usage".into(), - serde_json::json!({ - "inputTokens": usage.prompt_tokens.unwrap_or(0), - "outputTokens": usage.completion_tokens.unwrap_or(0) - }), - ); + obj.as_object_mut() + .unwrap() + .insert("usage".into(), usage.to_provider_value(self.format())); } Ok(obj) } - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option { - reason.map(|r| match r { - FinishReason::Stop => "end_turn".to_string(), - FinishReason::Length => "max_tokens".to_string(), - FinishReason::ToolCalls => "tool_use".to_string(), - FinishReason::ContentFilter => "content_filtered".to_string(), - FinishReason::Other(s) => s.clone(), - }) - } - // ========================================================================= // Streaming response handling // ========================================================================= @@ -323,13 +416,8 @@ impl ProviderAdapter for BedrockAdapter { // Handle messageStop - finish reason if let Some(stop_event) = payload.get("messageStop") { let stop_reason = stop_event.get("stopReason").and_then(Value::as_str); - let finish_reason = stop_reason.map(|r| match r { - "end_turn" | "stop_sequence" => "stop".to_string(), - "max_tokens" => "length".to_string(), - "tool_use" => "tool_calls".to_string(), - "content_filtered" => "content_filter".to_string(), - other => other.to_string(), - }); + let finish_reason = stop_reason + .map(|r| FinishReason::from_provider_string(r, self.format()).to_string()); return Ok(Some(UniversalStreamChunk::new( None, @@ -346,15 +434,9 @@ impl ProviderAdapter for BedrockAdapter { // Handle metadata - usage info if let Some(meta) = payload.get("metadata") { - let usage = meta.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("inputTokens").and_then(Value::as_i64), - completion_tokens: u.get("outputTokens").and_then(Value::as_i64), - prompt_cached_tokens: u.get("cacheReadInputTokens").and_then(Value::as_i64), - prompt_cache_creation_tokens: u - .get("cacheWriteInputTokens") - .and_then(Value::as_i64), - completion_reasoning_tokens: None, - }); + let usage = meta + .get("usage") + .map(|u| UniversalUsage::from_provider_value(u, self.format())); if usage.is_some() { return Ok(Some(UniversalStreamChunk::new( @@ -422,10 +504,7 @@ impl ProviderAdapter for BedrockAdapter { if let (true, Some(usage)) = (chunk.choices.is_empty(), &chunk.usage) { return Ok(serde_json::json!({ "metadata": { - "usage": { - "inputTokens": usage.prompt_tokens.unwrap_or(0), - "outputTokens": usage.completion_tokens.unwrap_or(0) - } + "usage": usage.to_provider_value(self.format()) } })); } @@ -539,4 +618,138 @@ mod tests { assert!(reconstructed.get("modelId").is_some()); assert!(reconstructed.get("messages").is_some()); } + + #[test] + fn test_bedrock_extracts_reasoning_from_additional_fields() { + let adapter = BedrockAdapter; + let payload = json!({ + "modelId": "anthropic.claude-3-7-sonnet", + "messages": [{ + "role": "user", + "content": [{"text": "Hello"}] + }], + "inferenceConfig": { + "maxTokens": 4096 + }, + "additionalModelRequestFields": { + "thinking": { + "type": "enabled", + "budget_tokens": 2048 + } + } + }); + + let universal = adapter.request_to_universal(payload).unwrap(); + assert!(universal.params.reasoning.is_some()); + + let reasoning = universal.params.reasoning.unwrap(); + assert_eq!(reasoning.enabled, Some(true)); + assert_eq!(reasoning.budget_tokens, Some(2048)); + } + + #[test] + fn test_bedrock_injects_reasoning_into_additional_fields() { + use crate::universal::request::ReasoningConfig; + + let adapter = BedrockAdapter; + + // Create a 
universal request with reasoning + let universal = UniversalRequest { + model: Some("anthropic.claude-3-7-sonnet".to_string()), + messages: vec![], + params: UniversalParams { + reasoning: Some(ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(3000), + ..Default::default() + }), + max_tokens: Some(4096), + ..Default::default() + }, + provider_extras: Default::default(), + }; + + let reconstructed = adapter.request_from_universal(&universal).unwrap(); + + // Check additionalModelRequestFields.thinking is present + let additional = reconstructed.get("additionalModelRequestFields").unwrap(); + let thinking = additional.get("thinking").unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 3000); + } + + #[test] + fn test_bedrock_reasoning_sets_temperature_to_1() { + use crate::universal::request::ReasoningConfig; + + let adapter = BedrockAdapter; + + // Create a universal request with reasoning and custom temperature + let universal = UniversalRequest { + model: Some("anthropic.claude-3-7-sonnet".to_string()), + messages: vec![], + params: UniversalParams { + reasoning: Some(ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(2048), + ..Default::default() + }), + temperature: Some(0.5), // This should be overridden to 1.0 + max_tokens: Some(4096), + ..Default::default() + }, + provider_extras: Default::default(), + }; + + let reconstructed = adapter.request_from_universal(&universal).unwrap(); + + // Temperature should be 1.0 when thinking is enabled + let inference_config = reconstructed.get("inferenceConfig").unwrap(); + assert_eq!(inference_config.get("temperature").unwrap(), 1.0); + } + + #[test] + fn test_bedrock_reasoning_roundtrip() { + let adapter = BedrockAdapter; + + // Start with a Bedrock request with thinking enabled + let payload = json!({ + "modelId": "anthropic.claude-3-7-sonnet", + "messages": [{ + "role": "user", + "content": [{"text": "Think about this carefully"}] + }], + "inferenceConfig": { + "maxTokens": 4096, + "temperature": 1.0 + }, + "additionalModelRequestFields": { + "thinking": { + "type": "enabled", + "budget_tokens": 2500 + } + } + }); + + // Convert to universal + let universal = adapter.request_to_universal(payload).unwrap(); + assert!(universal.params.reasoning.is_some()); + assert_eq!( + universal.params.reasoning.as_ref().unwrap().budget_tokens, + Some(2500) + ); + + // Convert back to Bedrock + let reconstructed = adapter.request_from_universal(&universal).unwrap(); + + // Verify thinking config is preserved + let additional = reconstructed.get("additionalModelRequestFields").unwrap(); + let thinking = additional.get("thinking").unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 2500); + + // Verify temperature is set to 1.0 + let inference_config = reconstructed.get("inferenceConfig").unwrap(); + assert_eq!(inference_config.get("temperature").unwrap(), 1.0); + } } diff --git a/crates/lingua/src/providers/bedrock/mod.rs b/crates/lingua/src/providers/bedrock/mod.rs index adb267bf..dc3623c1 100644 --- a/crates/lingua/src/providers/bedrock/mod.rs +++ b/crates/lingua/src/providers/bedrock/mod.rs @@ -8,6 +8,7 @@ using the official AWS SDK types for maximum compatibility. 
pub mod adapter; pub mod convert; pub mod detect; +pub mod params; pub mod request; pub mod response; diff --git a/crates/lingua/src/providers/bedrock/params.rs b/crates/lingua/src/providers/bedrock/params.rs new file mode 100644 index 00000000..9ffe8629 --- /dev/null +++ b/crates/lingua/src/providers/bedrock/params.rs @@ -0,0 +1,107 @@ +/*! +Typed parameter structs for Bedrock Converse API. + +These structs use `#[serde(flatten)]` to automatically capture unknown fields, +eliminating the need for explicit KNOWN_KEYS arrays. +*/ + +use crate::providers::bedrock::request::{ + BedrockInferenceConfiguration, BedrockMessage, BedrockToolConfiguration, +}; +use crate::serde_json::Value; +use serde::{Deserialize, Serialize}; +use std::collections::BTreeMap; + +/// Bedrock Converse API request parameters. +/// +/// All known fields are explicitly typed. Unknown fields automatically +/// go into `extras` via `#[serde(flatten)]`. +#[derive(Debug, Clone, Default, Serialize, Deserialize)] +#[serde(rename_all = "camelCase")] +pub struct BedrockParams { + // === Core fields === + pub model_id: Option, + pub messages: Option>, + + // === System prompt === + pub system: Option, + + // === Inference configuration === + pub inference_config: Option, + + // === Tools and function calling === + pub tool_config: Option, + + // === Guardrails === + pub guardrail_config: Option, + + // === Additional model fields === + pub additional_model_request_fields: Option, + pub additional_model_response_field_paths: Option>, + + // === Prompt templates === + pub prompt_variables: Option, + + /// Unknown fields - automatically captured by serde flatten. + /// These are provider-specific fields not in the canonical set. + #[serde(flatten)] + pub extras: BTreeMap, +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json; + use crate::serde_json::json; + + #[test] + fn test_bedrock_params_known_fields() { + let json = json!({ + "modelId": "anthropic.claude-3-sonnet", + "messages": [{"role": "user", "content": [{"text": "Hello"}]}], + "inferenceConfig": { + "temperature": 0.7, + "maxTokens": 1024 + } + }); + + let params: BedrockParams = serde_json::from_value(json).unwrap(); + assert_eq!( + params.model_id, + Some("anthropic.claude-3-sonnet".to_string()) + ); + assert!(params.inference_config.is_some()); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_bedrock_params_unknown_fields_go_to_extras() { + let json = json!({ + "modelId": "anthropic.claude-3-sonnet", + "messages": [], + "someFutureParam": "value" + }); + + let params: BedrockParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.extras.len(), 1); + assert_eq!( + params.extras.get("someFutureParam"), + Some(&Value::String("value".to_string())) + ); + } + + #[test] + fn test_bedrock_roundtrip_preserves_extras() { + let json = json!({ + "modelId": "anthropic.claude-3-sonnet", + "messages": [], + "customField": {"nested": "data"} + }); + + let params: BedrockParams = serde_json::from_value(json.clone()).unwrap(); + let back: Value = serde_json::to_value(¶ms).unwrap(); + + // Custom field should be preserved + assert_eq!(back.get("customField"), json.get("customField")); + } +} diff --git a/crates/lingua/src/providers/google/adapter.rs b/crates/lingua/src/providers/google/adapter.rs index 17142c5b..3d56a650 100644 --- a/crates/lingua/src/providers/google/adapter.rs +++ b/crates/lingua/src/providers/google/adapter.rs @@ -9,33 +9,24 @@ Google's API has some unique characteristics: */ use crate::capabilities::ProviderFormat; -use 
crate::processing::adapters::{collect_extras, ProviderAdapter}; +use crate::error::ConvertError; +use crate::processing::adapters::ProviderAdapter; use crate::processing::transform::TransformError; use crate::providers::google::detect::try_parse_google; use crate::providers::google::generated::{ - candidate, generate_content_response, part, Content as GoogleContent, GenerateContentRequest, - GenerateContentResponse, GenerationConfig, + Content as GoogleContent, GenerationConfig, ThinkingConfig, }; +use crate::providers::google::params::GoogleParams; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::Message; +use crate::universal::tools::{UniversalTool, UniversalToolType}; use crate::universal::{ extract_system_messages, flatten_consecutive_messages, FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, UserContent, }; - -/// Known request fields for Google GenerateContent API. -/// Fields not in this list go into `extras`. -const GOOGLE_KNOWN_KEYS: &[&str] = &[ - "contents", - "generationConfig", - "systemInstruction", - "safetySettings", - "tools", - "toolConfig", - "model", -]; +use std::collections::HashMap; /// Adapter for Google AI GenerateContent API. pub struct GoogleAdapter; @@ -58,34 +49,48 @@ impl ProviderAdapter for GoogleAdapter { } fn request_to_universal(&self, payload: Value) -> Result { - let extras = collect_extras(&payload, GOOGLE_KNOWN_KEYS); - let model = payload - .get("model") - .and_then(Value::as_str) - .map(String::from); - - let request: GenerateContentRequest = serde_json::from_value(payload) + // Single parse: typed params now includes typed contents and generation_config + let typed_params: GoogleParams = serde_json::from_value(payload) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let messages = as TryFromLLM>>::try_from(request.contents) + let model = typed_params.model.clone(); + + // Extract typed contents (partial move - other fields remain accessible) + let contents = typed_params.contents.ok_or_else(|| { + TransformError::ToUniversalFailed("Google: missing 'contents' field".to_string()) + })?; + + let messages = as TryFromLLM>>::try_from(contents) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - // Extract params from generationConfig - let (temperature, top_p, top_k, max_tokens, stop) = - if let Some(config) = &request.generation_config { + // Extract params from generationConfig (now typed in params struct) + let (temperature, top_p, top_k, max_tokens, stop, reasoning) = + if let Some(config) = &typed_params.generation_config { + let max_tokens = config.max_output_tokens.map(|t| t as i64); + // Convert Google's thinkingConfig to ReasoningConfig + let reasoning = config.thinking_config.as_ref().map(|tc| { + crate::universal::ReasoningConfig { + enabled: tc.include_thoughts.or(Some(true)), // If thinking_config exists, it's enabled + budget_tokens: tc.thinking_budget.map(|b| b as i64), + ..Default::default() + } + }); + // Generated type has stop_sequences as Vec, convert to Option + let stop = if config.stop_sequences.is_empty() { + None + } else { + Some(config.stop_sequences.clone()) + }; ( config.temperature.map(|t| t as f64), config.top_p.map(|p| p as f64), config.top_k.map(|k| k as i64), - config.max_output_tokens.map(|t| t as i64), - if config.stop_sequences.is_empty() { - None - } else { - serde_json::to_value(&config.stop_sequences).ok() - }, + max_tokens, + stop, + 
reasoning, ) } else { - (None, None, None, None, None) + (None, None, None, None, None, None) }; let params = UniversalParams { @@ -94,24 +99,76 @@ impl ProviderAdapter for GoogleAdapter { top_k, max_tokens, stop, - tools: if request.tools.is_empty() { - None - } else { - serde_json::to_value(&request.tools).ok() - }, + tools: typed_params.tools.and_then(|t| { + // Google uses [{functionDeclarations: [{name, description, parameters}]}] + // Parse into UniversalTools + let value = serde_json::to_value(&t).ok()?; + let tools_arr = value.as_array()?; + + let mut universal_tools = Vec::new(); + for tool_group in tools_arr { + if let Some(func_decls) = tool_group.get("functionDeclarations") { + if let Some(decls) = func_decls.as_array() { + for decl in decls { + let name = decl.get("name").and_then(|v| v.as_str())?; + let description = decl + .get("description") + .and_then(|v| v.as_str()) + .map(String::from); + let parameters = decl.get("parameters").cloned(); + + universal_tools.push(UniversalTool::function( + name, + description, + parameters, + )); + } + } + } + } + + if universal_tools.is_empty() { + // Fallback: store as builtin for unknown format + Some(vec![UniversalTool::builtin( + "google_tools", + "google", + "unknown", + Some(value), + )]) + } else { + Some(universal_tools) + } + }), tool_choice: None, // Google uses different mechanism response_format: None, seed: None, // Google doesn't support seed presence_penalty: None, frequency_penalty: None, stream: None, // Google uses endpoint-based streaming + // New canonical fields - Google doesn't support most of these + parallel_tool_calls: None, + reasoning, + metadata: None, + store: None, + service_tier: None, + logprobs: None, + top_logprobs: None, }; + // Use extras captured automatically via #[serde(flatten)] + let mut provider_extras = HashMap::new(); + if !typed_params.extras.is_empty() { + provider_extras.insert( + ProviderFormat::Google, + typed_params.extras.into_iter().collect(), + ); + } + Ok(UniversalRequest { model, messages, params, - extras, + provider_extras, }) } @@ -171,60 +228,114 @@ impl ProviderAdapter for GoogleAdapter { } // Build generationConfig if any params are set - let stop_sequences = req + let has_reasoning = req .params - .stop + .reasoning .as_ref() - .map(|stop| match stop { - Value::Array(arr) => arr - .iter() - .filter_map(|s| s.as_str().map(|v| v.to_string())) - .collect::>(), - Value::String(s) => vec![s.clone()], - _ => Vec::new(), - }) - .unwrap_or_default(); - - let config = GenerationConfig { - temperature: req.params.temperature.map(|t| t as f32), - top_p: req.params.top_p.map(|p| p as f32), - top_k: req.params.top_k.map(|k| k as i32), - max_output_tokens: req.params.max_tokens.map(|t| t as i32), - stop_sequences, - ..GenerationConfig::default() - }; + .map(|r| !r.is_effectively_disabled()) + .unwrap_or(false); + let has_params = req.params.temperature.is_some() + || req.params.top_p.is_some() + || req.params.top_k.is_some() + || req.params.max_tokens.is_some() + || req.params.stop.is_some() + || has_reasoning; + + if has_params { + // Convert ReasoningConfig to Google's thinkingConfig + let thinking_config = req.params.reasoning.as_ref().and_then(|r| { + if r.is_effectively_disabled() { + return None; + } + // Use budget_tokens or default minimum + let budget = r + .budget_tokens + .unwrap_or(crate::universal::reasoning::MIN_THINKING_BUDGET); + Some(ThinkingConfig { + include_thoughts: Some(true), + thinking_budget: Some(budget as i32), + }) + }); + + // Generated type has stop_sequences 
as Vec, not Option + let stop_sequences = req.params.stop.clone().unwrap_or_default(); + + let config = GenerationConfig { + temperature: req.params.temperature.map(|t| t as f32), + top_p: req.params.top_p.map(|p| p as f32), + top_k: req.params.top_k.map(|k| k as i32), + max_output_tokens: req.params.max_tokens.map(|t| t as i32), + stop_sequences, + thinking_config, + ..Default::default() + }; - let config_value = serde_json::to_value(config) - .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; - if !config_value - .as_object() - .map(|map| map.is_empty()) - .unwrap_or(true) - { - obj.insert("generationConfig".into(), config_value); + obj.insert( + "generationConfig".into(), + serde_json::to_value(config) + .map_err(|e| TransformError::SerializationFailed(e.to_string()))?, + ); } // Add tools if present + // Google uses functionDeclarations format: [{name, description, parameters}] if let Some(tools) = &req.params.tools { - obj.insert("tools".into(), tools.clone()); + // First check for Google builtins (pass through original config) + let mut google_builtin_found = false; + for tool in tools { + if let UniversalToolType::Builtin { + provider, config, .. + } = &tool.tool_type + { + if provider == "google" { + if let Some(config_value) = config { + obj.insert("tools".into(), config_value.clone()); + google_builtin_found = true; + break; + } + } + } + } + + // If no Google builtin, convert function tools to Google format + if !google_builtin_found { + let function_declarations: Vec = tools + .iter() + .filter_map(|tool| { + if tool.is_function() { + Some(serde_json::json!({ + "name": tool.name, + "description": tool.description, + "parameters": tool.parameters.clone().unwrap_or(serde_json::json!({})) + })) + } else { + None + } + }) + .collect(); + + if !function_declarations.is_empty() { + obj.insert( + "tools".into(), + serde_json::json!([{"functionDeclarations": function_declarations}]), + ); + } + } } - // Merge extras - only include Google-known fields - // This filters out OpenAI-specific fields like stream_options that would cause - // Google to reject the request with "Unknown name: stream_options" - for (k, v) in &req.extras { - if GOOGLE_KNOWN_KEYS.contains(&k.as_str()) { - obj.insert(k.clone(), v.clone()); + // Merge back provider-specific extras (only for Google) + if let Some(extras) = req.provider_extras.get(&ProviderFormat::Google) { + for (k, v) in extras { + // Don't overwrite canonical fields we already handled + if !obj.contains_key(k) { + obj.insert(k.clone(), v.clone()); + } } } Ok(Value::Object(obj)) } - fn apply_defaults(&self, _req: &mut UniversalRequest) { - // Google doesn't require any specific defaults - } - fn detect_response(&self, payload: &Value) -> bool { // Google response has candidates[].content structure payload @@ -234,52 +345,42 @@ impl ProviderAdapter for GoogleAdapter { } fn response_to_universal(&self, payload: Value) -> Result { - let response: GenerateContentResponse = serde_json::from_value(payload) - .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let GenerateContentResponse { - candidates, - usage_metadata, - model_version, - .. 
- } = response; + let candidates = payload + .get("candidates") + .and_then(Value::as_array) + .ok_or_else(|| TransformError::ToUniversalFailed("missing candidates".to_string()))?; let mut messages = Vec::new(); let mut finish_reason = None; for candidate in candidates { - let content = candidate.content; - let finish_reason_value = candidate.finish_reason; - - if let Some(content) = content { + if let Some(content_val) = candidate.get("content") { + let content: GoogleContent = serde_json::from_value(content_val.clone()) + .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; let universal = >::try_from(content) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; messages.push(universal); } // Get finishReason from first candidate - if finish_reason.is_none() && finish_reason_value != 0 { - let reason = candidate::FinishReason::try_from(finish_reason_value) - .ok() - .map(|r| r.as_str_name()) - .unwrap_or("FINISH_REASON_UNSPECIFIED"); - finish_reason = Some(reason.parse().unwrap()); + if finish_reason.is_none() { + if let Some(reason) = candidate.get("finishReason").and_then(Value::as_str) { + finish_reason = + Some(reason.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "FinishReason", + value: reason.to_string(), + })?); + } } } - let usage = usage_metadata.map(|u| UniversalUsage { - prompt_tokens: Some(u.prompt_token_count as i64), - completion_tokens: Some(u.candidates_token_count as i64), - prompt_cached_tokens: Some(u.cached_content_token_count as i64), - prompt_cache_creation_tokens: None, // Google doesn't report cache creation tokens - completion_reasoning_tokens: Some(u.thoughts_token_count as i64), - }); + let usage = UniversalUsage::extract_from_response(&payload, self.format()); Ok(UniversalResponse { - model: if model_version.is_empty() { - None - } else { - Some(model_version) - }, + model: payload + .get("modelVersion") + .and_then(Value::as_str) + .map(String::from), messages, usage, finish_reason, @@ -287,73 +388,43 @@ impl ProviderAdapter for GoogleAdapter { } fn response_from_universal(&self, resp: &UniversalResponse) -> Result { - let finish_reason = map_finish_reason_to_candidate_enum( - self.map_finish_reason(resp.finish_reason.as_ref()), - ); + let finish_reason = resp + .finish_reason + .as_ref() + .map(|r| r.to_provider_string(self.format()).to_string()) + .unwrap_or_else(|| "STOP".to_string()); - let candidates = resp + let candidates: Vec = resp .messages .iter() .enumerate() .map(|(i, msg)| { let content = >::try_from(msg.clone()) .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; - Ok(crate::providers::google::generated::Candidate { - index: Some(i as i32), - content: Some(content), - finish_reason, - finish_message: None, - safety_ratings: Vec::new(), - citation_metadata: None, - token_count: 0, - grounding_attributions: Vec::new(), - grounding_metadata: None, - avg_logprobs: 0.0, - logprobs_result: None, - url_context_metadata: None, - }) + + let content_value = serde_json::to_value(&content) + .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; + + Ok(serde_json::json!({ + "index": i, + "content": content_value, + "finishReason": finish_reason + })) }) .collect::, TransformError>>()?; - let usage_metadata = resp.usage.as_ref().map(|usage| { - let prompt = usage.prompt_tokens.unwrap_or(0) as i32; - let completion = usage.completion_tokens.unwrap_or(0) as i32; - generate_content_response::UsageMetadata { - prompt_token_count: prompt, - cached_content_token_count: 
usage.prompt_cached_tokens.unwrap_or(0) as i32, - candidates_token_count: completion, - tool_use_prompt_token_count: 0, - thoughts_token_count: usage.completion_reasoning_tokens.unwrap_or(0) as i32, - total_token_count: prompt + completion, - prompt_tokens_details: Vec::new(), - cache_tokens_details: Vec::new(), - candidates_tokens_details: Vec::new(), - tool_use_prompt_tokens_details: Vec::new(), - } + let mut obj = serde_json::json!({ + "candidates": candidates }); - let response = GenerateContentResponse { - candidates, - prompt_feedback: None, - usage_metadata, - model_version: resp.model.clone().unwrap_or_default(), - response_id: String::new(), - }; - - let mut value = serde_json::to_value(response) - .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; - ensure_candidates_field(&mut value); - Ok(value) - } + if let Some(usage) = &resp.usage { + obj.as_object_mut().unwrap().insert( + "usageMetadata".into(), + usage.to_provider_value(self.format()), + ); + } - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option { - reason.map(|r| match r { - FinishReason::Stop => "STOP".to_string(), - FinishReason::Length => "MAX_TOKENS".to_string(), - FinishReason::ToolCalls => "TOOL_CALLS".to_string(), - FinishReason::ContentFilter => "SAFETY".to_string(), - FinishReason::Other(s) => s.clone(), - }) + Ok(obj) } // ========================================================================= @@ -370,48 +441,35 @@ impl ProviderAdapter for GoogleAdapter { &self, payload: Value, ) -> Result, TransformError> { - let response: GenerateContentResponse = serde_json::from_value(payload) - .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let GenerateContentResponse { - candidates, - usage_metadata, - model_version, - response_id, - .. 
- } = response; + let candidates = payload + .get("candidates") + .and_then(Value::as_array) + .ok_or_else(|| TransformError::ToUniversalFailed("missing candidates".to_string()))?; let mut choices = Vec::new(); for candidate in candidates { - let index = candidate.index.unwrap_or(0) as u32; + let index = candidate.get("index").and_then(Value::as_u64).unwrap_or(0) as u32; // Extract text from content.parts let text: String = candidate - .content - .as_ref() - .map(|content| { - content - .parts + .get("content") + .and_then(|c| c.get("parts")) + .and_then(Value::as_array) + .map(|parts| { + parts .iter() - .filter_map(|part| match &part.data { - Some(part::Data::Text(text)) => Some(text.as_str()), - _ => None, - }) + .filter_map(|p| p.get("text").and_then(Value::as_str)) .collect::>() .join("") }) .unwrap_or_default(); - // Map finish reason - let finish_reason = candidate::FinishReason::try_from(candidate.finish_reason) - .ok() - .map(|r| r.as_str_name()) - .map(|r| match r { - "STOP" => "stop".to_string(), - "MAX_TOKENS" => "length".to_string(), - "SAFETY" | "RECITATION" | "OTHER" => "content_filter".to_string(), - other => other.to_lowercase(), - }); + // Map finish reason using centralized helper + let finish_reason = candidate + .get("finishReason") + .and_then(Value::as_str) + .map(|r| FinishReason::from_provider_string(r, self.format()).to_string()); choices.push(UniversalStreamChoice { index, @@ -424,24 +482,17 @@ impl ProviderAdapter for GoogleAdapter { } // Extract usage from usageMetadata - let usage = usage_metadata.map(|u| UniversalUsage { - prompt_tokens: Some(u.prompt_token_count as i64), - completion_tokens: Some(u.candidates_token_count as i64), - prompt_cached_tokens: Some(u.cached_content_token_count as i64), - prompt_cache_creation_tokens: None, - completion_reasoning_tokens: Some(u.thoughts_token_count as i64), - }); + let usage = UniversalUsage::extract_from_response(&payload, self.format()); - let model = if model_version.is_empty() { - None - } else { - Some(model_version) - }; - let id = if response_id.is_empty() { - None - } else { - Some(response_id) - }; + let model = payload + .get("modelVersion") + .and_then(Value::as_str) + .map(String::from); + + let id = payload + .get("responseId") + .and_then(Value::as_str) + .map(String::from); Ok(Some(UniversalStreamChunk::new( id, model, choices, None, usage, @@ -449,123 +500,73 @@ impl ProviderAdapter for GoogleAdapter { } fn stream_from_universal(&self, chunk: &UniversalStreamChunk) -> Result { - let candidates = if chunk.is_keep_alive() { - Vec::new() - } else { - chunk - .choices - .iter() - .map(|c| { - // Extract text content from delta - let text = c - .delta - .as_ref() - .and_then(|d| d.get("content")) - .and_then(Value::as_str) - .unwrap_or(""); - - let finish_reason = - map_stream_finish_reason_to_candidate_enum(c.finish_reason.as_deref()); - - crate::providers::google::generated::Candidate { - index: Some(c.index as i32), - content: Some(GoogleContent { - role: "model".to_string(), - parts: vec![crate::providers::google::generated::Part { - thought: false, - thought_signature: Vec::new(), - part_metadata: None, - data: Some(part::Data::Text(text.to_string())), - metadata: None, - }], - }), - finish_reason, - finish_message: None, - safety_ratings: Vec::new(), - citation_metadata: None, - token_count: 0, - grounding_attributions: Vec::new(), - grounding_metadata: None, - avg_logprobs: 0.0, - logprobs_result: None, - url_context_metadata: None, + if chunk.is_keep_alive() { + // Google doesn't have a keep-alive 
event, return empty candidates + return Ok(serde_json::json!({ + "candidates": [] + })); + } + + let candidates: Vec = chunk + .choices + .iter() + .map(|c| { + // Extract text content from delta + let text = c + .delta + .as_ref() + .and_then(|d| d.get("content")) + .and_then(Value::as_str) + .unwrap_or(""); + + // Map finish reason to Google format + let finish_reason = c.finish_reason.as_ref().map(|r| match r.as_str() { + "stop" => "STOP", + "length" => "MAX_TOKENS", + "tool_calls" => "TOOL_CALLS", + "content_filter" => "SAFETY", + other => other, + }); + + let mut candidate = serde_json::json!({ + "index": c.index, + "content": { + "parts": [{"text": text}], + "role": "model" } - }) - .collect::>() - }; + }); - let usage_metadata = chunk.usage.as_ref().map(|usage| { - let prompt = usage.prompt_tokens.unwrap_or(0) as i32; - let completion = usage.completion_tokens.unwrap_or(0) as i32; - generate_content_response::UsageMetadata { - prompt_token_count: prompt, - cached_content_token_count: usage.prompt_cached_tokens.unwrap_or(0) as i32, - candidates_token_count: completion, - tool_use_prompt_token_count: 0, - thoughts_token_count: usage.completion_reasoning_tokens.unwrap_or(0) as i32, - total_token_count: prompt + completion, - prompt_tokens_details: Vec::new(), - cache_tokens_details: Vec::new(), - candidates_tokens_details: Vec::new(), - tool_use_prompt_tokens_details: Vec::new(), - } - }); + if let Some(reason) = finish_reason { + candidate + .as_object_mut() + .unwrap() + .insert("finishReason".into(), Value::String(reason.to_string())); + } - let response = GenerateContentResponse { - candidates, - prompt_feedback: None, - usage_metadata, - model_version: chunk.model.clone().unwrap_or_default(), - response_id: chunk.id.clone().unwrap_or_default(), - }; + candidate + }) + .collect(); - let mut value = serde_json::to_value(response) - .map_err(|e| TransformError::SerializationFailed(e.to_string()))?; - ensure_candidates_field(&mut value); - Ok(value) - } -} + let mut obj = serde_json::json!({ + "candidates": candidates + }); + + let obj_map = obj.as_object_mut().unwrap(); -fn map_finish_reason_to_candidate_enum(reason_str: Option) -> i32 { - if let Some(reason_str) = reason_str { - if let Some(mapped) = candidate::FinishReason::from_str_name(&reason_str) { - return mapped as i32; + if let Some(ref id) = chunk.id { + obj_map.insert("responseId".into(), Value::String(id.clone())); } - if reason_str == "TOOL_CALLS" { - return candidate::FinishReason::Other as i32; + if let Some(ref model) = chunk.model { + obj_map.insert("modelVersion".into(), Value::String(model.clone())); + } + if let Some(ref usage) = chunk.usage { + obj_map.insert( + "usageMetadata".into(), + usage.to_provider_value(self.format()), + ); } - } - 0 -} - -fn map_stream_finish_reason_to_candidate_enum(reason: Option<&str>) -> i32 { - let reason = match reason { - Some(value) => value, - None => return 0, - }; - - if reason.eq_ignore_ascii_case("stop") { - return candidate::FinishReason::Stop as i32; - } - if reason.eq_ignore_ascii_case("length") || reason.eq_ignore_ascii_case("max_tokens") { - return candidate::FinishReason::MaxTokens as i32; - } - if reason.eq_ignore_ascii_case("content_filter") { - return candidate::FinishReason::Safety as i32; - } - if reason.eq_ignore_ascii_case("tool_calls") || reason.eq_ignore_ascii_case("tool_use") { - return candidate::FinishReason::Other as i32; - } - if let Some(mapped) = candidate::FinishReason::from_str_name(reason) { - return mapped as i32; - } - 
candidate::FinishReason::Other as i32 -} -fn ensure_candidates_field(value: &mut Value) { - if let Value::Object(map) = value { - map.entry("candidates".to_string()) - .or_insert_with(|| Value::Array(Vec::new())); + Ok(obj) } } @@ -601,8 +602,8 @@ mod tests { }); let universal = adapter.request_to_universal(payload).unwrap(); - let temperature = universal.params.temperature.unwrap(); - assert_eq!(temperature as f32, 0.7f32); + // Use approximate comparison due to f32->f64 conversion precision + assert!((universal.params.temperature.unwrap() - 0.7).abs() < 0.001); assert_eq!(universal.params.max_tokens, Some(1024)); let reconstructed = adapter.request_from_universal(&universal).unwrap(); diff --git a/crates/lingua/src/providers/google/mod.rs b/crates/lingua/src/providers/google/mod.rs index 5762bfc8..a2d8add8 100644 --- a/crates/lingua/src/providers/google/mod.rs +++ b/crates/lingua/src/providers/google/mod.rs @@ -5,6 +5,7 @@ pub mod adapter; pub mod convert; pub mod detect; pub mod generated; +pub mod params; // Re-export adapter pub use adapter::GoogleAdapter; diff --git a/crates/lingua/src/providers/google/params.rs b/crates/lingua/src/providers/google/params.rs new file mode 100644 index 00000000..e4dffab5 --- /dev/null +++ b/crates/lingua/src/providers/google/params.rs @@ -0,0 +1,97 @@ +/*! +Typed parameter structs for Google GenerateContent API. + +These structs use `#[serde(flatten)]` to automatically capture unknown fields, +eliminating the need for explicit KNOWN_KEYS arrays. +*/ + +use crate::providers::google::generated::{Content, GenerationConfig, Tool}; +use crate::serde_json::Value; +use serde::{Deserialize, Serialize}; +use std::collections::BTreeMap; + +/// Google GenerateContent API request parameters. +/// +/// All known fields are explicitly typed. Unknown fields automatically +/// go into `extras` via `#[serde(flatten)]`. +#[derive(Debug, Clone, Default, Serialize, Deserialize)] +#[serde(rename_all = "camelCase")] +pub struct GoogleParams { + // === Core fields === + pub model: Option, + pub contents: Option>, + + // === System prompt === + pub system_instruction: Option, + + // === Generation configuration === + pub generation_config: Option, + + // === Safety settings === + pub safety_settings: Option, + + // === Tools and function calling === + pub tools: Option>, + pub tool_config: Option, + + // === Caching === + pub cached_content: Option, + + /// Unknown fields - automatically captured by serde flatten. + /// These are provider-specific fields not in the canonical set. 
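+    ///
+    /// A minimal sketch of the flatten behaviour (the `labels` key below is a
+    /// hypothetical unknown field, not a documented Google parameter):
+    ///
+    /// ```ignore
+    /// let params: GoogleParams = serde_json::from_value(json!({
+    ///     "contents": [],
+    ///     "labels": {"team": "demo"}
+    /// }))?;
+    /// // The unknown "labels" key is captured in `extras`...
+    /// assert_eq!(params.extras.len(), 1);
+    /// // ...and serialized back out unchanged on the return trip.
+    /// let back = serde_json::to_value(&params)?;
+    /// assert_eq!(back.get("labels"), Some(&json!({"team": "demo"})));
+    /// ```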
+ #[serde(flatten)] + pub extras: BTreeMap, +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json; + use crate::serde_json::json; + + #[test] + fn test_google_params_known_fields() { + let json = json!({ + "model": "gemini-pro", + "contents": [{"role": "user", "parts": [{"text": "Hello"}]}], + "generationConfig": { + "temperature": 0.7, + "maxOutputTokens": 1024 + } + }); + + let params: GoogleParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.model, Some("gemini-pro".to_string())); + assert!(params.generation_config.is_some()); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_google_params_unknown_fields_go_to_extras() { + let json = json!({ + "contents": [{"parts": [{"text": "Hello"}]}], + "someFutureParam": "value" + }); + + let params: GoogleParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.extras.len(), 1); + assert_eq!( + params.extras.get("someFutureParam"), + Some(&Value::String("value".to_string())) + ); + } + + #[test] + fn test_google_roundtrip_preserves_extras() { + let json = json!({ + "contents": [], + "customField": {"nested": "data"} + }); + + let params: GoogleParams = serde_json::from_value(json.clone()).unwrap(); + let back: Value = serde_json::to_value(¶ms).unwrap(); + + // Custom field should be preserved + assert_eq!(back.get("customField"), json.get("customField")); + } +} diff --git a/crates/lingua/src/providers/openai/adapter.rs b/crates/lingua/src/providers/openai/adapter.rs index 79fc9efc..6eb4164f 100644 --- a/crates/lingua/src/providers/openai/adapter.rs +++ b/crates/lingua/src/providers/openai/adapter.rs @@ -1,78 +1,43 @@ /*! -OpenAI provider adapters for chat completions and responses API. +OpenAI Chat Completions API adapter. -This module provides two adapters: -- `OpenAIAdapter` for the standard Chat Completions API -- `ResponsesAdapter` for the Responses API (used by reasoning models like o1) +This module provides the `OpenAIAdapter` for the standard Chat Completions API, +along with target-specific transformation utilities for providers like Azure, +Vertex, and Mistral. 
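+
+A minimal round-trip sketch, assuming a Chat Completions payload (the JSON
+fields shown are illustrative, not an exhaustive request):
+
+```ignore
+let adapter = OpenAIAdapter;
+let payload = serde_json::json!({
+    "model": "gpt-4",
+    "messages": [{"role": "user", "content": "Hello"}],
+    "temperature": 0.7
+});
+// Parse into the provider-agnostic UniversalRequest, then rebuild the
+// provider payload; fields outside the canonical set survive via
+// `provider_extras`.
+let universal = adapter.request_to_universal(payload)?;
+let rebuilt = adapter.request_from_universal(&universal)?;
+```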
*/ use crate::capabilities::ProviderFormat; +use crate::error::ConvertError; +use crate::reject_params; +use std::collections::HashMap; + use crate::processing::adapters::{ - collect_extras, insert_opt_bool, insert_opt_f64, insert_opt_i64, insert_opt_value, - ProviderAdapter, + insert_opt_bool, insert_opt_f64, insert_opt_i64, insert_opt_value, ProviderAdapter, }; use crate::processing::transform::TransformError; use crate::providers::openai::capabilities::{OpenAICapabilities, TargetProvider}; +use crate::providers::openai::convert::{ + ChatCompletionRequestMessageExt, ChatCompletionResponseMessageExt, +}; use crate::providers::openai::generated::{ - AllowedToolsFunction, ChatCompletionRequestMessage, ChatCompletionRequestMessageContent, + AllowedToolsFunction, ChatCompletionRequestMessageContent, ChatCompletionRequestMessageContentPart, ChatCompletionRequestMessageRole, - ChatCompletionResponseMessage, ChatCompletionToolChoiceOption, - CreateChatCompletionRequestClass, CreateResponseClass, File, FunctionObject, - FunctionToolChoiceClass, FunctionToolChoiceType, InputItem, InputItemContent, InputItemRole, - InputItemType, Instructions, PurpleType, ResponseFormatType, ToolElement, ToolType, -}; -use crate::providers::openai::{ - try_parse_openai, try_parse_responses, universal_to_responses_input, + ChatCompletionToolChoiceOption, CreateChatCompletionRequestClass, File, FunctionObject, + FunctionToolChoiceClass, FunctionToolChoiceType, PurpleType, ResponseFormatType, ToolElement, + ToolType, }; +use crate::providers::openai::params::OpenAIChatParams; +use crate::providers::openai::try_parse_openai; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; -use crate::universal::message::{AssistantContent, Message, UserContent}; +use crate::universal::message::Message; +use crate::universal::tools::{tools_to_openai_chat_value, UniversalTool}; use crate::universal::{ - FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, - UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, + parse_stop_sequences, UniversalParams, UniversalRequest, UniversalResponse, + UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, }; use crate::util::media::parse_base64_data_url; - -/// Known request fields for OpenAI Chat Completions API. -/// These are fields extracted into UniversalRequest/UniversalParams. -/// Fields not in this list go into `extras` for passthrough. -const OPENAI_KNOWN_KEYS: &[&str] = &[ - "model", - "messages", - "temperature", - "top_p", - "max_tokens", - "max_completion_tokens", - "stop", - "tools", - "tool_choice", - "response_format", - "seed", - "presence_penalty", - "frequency_penalty", - "stream", - // OpenAI-specific fields (not in UniversalParams) go to extras: - // stream_options, n, logprobs, top_logprobs, logit_bias, - // user, store, metadata, parallel_tool_calls, service_tier -]; - -/// Known request fields for OpenAI Responses API. -/// These are fields extracted into UniversalRequest/UniversalParams. -/// Fields not in this list go into `extras` for passthrough. 
-const RESPONSES_KNOWN_KEYS: &[&str] = &[ - "model", - "input", - "temperature", - "top_p", - "max_output_tokens", - "tools", - "tool_choice", - "stream", - // Responses-specific fields (not in UniversalParams) go to extras: - // instructions, stop, response_format, seed, presence_penalty, - // frequency_penalty, reasoning, truncation, user, store, - // metadata, parallel_tool_calls -]; +use std::convert::TryInto; /// Adapter for OpenAI Chat Completions API. pub struct OpenAIAdapter; @@ -95,37 +60,123 @@ impl ProviderAdapter for OpenAIAdapter { } fn request_to_universal(&self, payload: Value) -> Result { - let extras = collect_extras(&payload, OPENAI_KNOWN_KEYS); - let request: CreateChatCompletionRequestClass = serde_json::from_value(payload) + // Parse params (messages will be parsed separately to preserve reasoning field) + let typed_params: OpenAIChatParams = serde_json::from_value(payload.clone()) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let messages = as TryFromLLM>>::try_from(request.messages) + // Extract and parse messages as extended type to capture reasoning field + let messages_val = payload + .get("messages") + .ok_or_else(|| { + TransformError::ToUniversalFailed("OpenAI: missing 'messages' field".to_string()) + })? + .as_array() + .ok_or_else(|| { + TransformError::ToUniversalFailed("OpenAI: 'messages' must be an array".to_string()) + })?; + + let provider_messages: Vec = messages_val + .iter() + .map(|msg_val| { + serde_json::from_value(msg_val.clone()) + .map_err(|e| TransformError::ToUniversalFailed(e.to_string())) + }) + .collect::, _>>()?; + + let messages = as TryFromLLM>>::try_from(provider_messages) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let params = UniversalParams { - temperature: request.temperature, - top_p: request.top_p, + // Extract max_tokens first - needed for reasoning budget computation + let max_tokens = typed_params + .max_tokens + .or(typed_params.max_completion_tokens); + + // Convert reasoning effort to ReasoningConfig, computing budget_tokens with max_tokens context + let reasoning = typed_params + .reasoning_effort + .map(|effort| (effort, max_tokens).into()); + + // Build canonical params from typed fields + let mut params = UniversalParams { + temperature: typed_params.temperature, + top_p: typed_params.top_p, top_k: None, // OpenAI doesn't support top_k - max_tokens: request.max_tokens.or(request.max_completion_tokens), - stop: request.stop.and_then(|s| serde_json::to_value(s).ok()), - tools: request.tools.and_then(|t| serde_json::to_value(t).ok()), - tool_choice: request + max_tokens, + stop: typed_params.stop.as_ref().and_then(parse_stop_sequences), + tools: typed_params + .tools + .as_ref() + .map(UniversalTool::from_value_array), + tool_choice: typed_params .tool_choice - .and_then(|t| serde_json::to_value(t).ok()), - response_format: request + .as_ref() + .and_then(|v| (ProviderFormat::OpenAI, v).try_into().ok()), + response_format: typed_params .response_format - .and_then(|r| serde_json::to_value(r).ok()), - seed: request.seed, - presence_penalty: request.presence_penalty, - frequency_penalty: request.frequency_penalty, - stream: request.stream, + .as_ref() + .and_then(|v| (ProviderFormat::OpenAI, v).try_into().ok()), + seed: typed_params.seed, + presence_penalty: typed_params.presence_penalty, + frequency_penalty: typed_params.frequency_penalty, + stream: typed_params.stream, + // New canonical fields + parallel_tool_calls: typed_params.parallel_tool_calls, + reasoning, + metadata: 
typed_params.metadata, + store: typed_params.store, + service_tier: typed_params.service_tier, + logprobs: typed_params.logprobs, + top_logprobs: typed_params.top_logprobs, }; + // Sync parallel_tool_calls with tool_choice.disable_parallel for roundtrip fidelity + // OpenAI uses parallel_tool_calls at params level, Anthropic uses tool_choice.disable_parallel + if params.parallel_tool_calls == Some(false) { + if let Some(ref mut tc) = params.tool_choice { + if tc.disable_parallel.is_none() { + tc.disable_parallel = Some(true); + } + } + } + + // Collect provider-specific extras for round-trip preservation + // This includes both unknown fields (from serde flatten) and known OpenAI fields + // that aren't part of UniversalParams + let mut extras_map: Map = typed_params.extras.into_iter().collect(); + + // Add OpenAI-specific known fields that aren't in UniversalParams + if let Some(user) = typed_params.user { + extras_map.insert("user".into(), Value::String(user)); + } + if let Some(n) = typed_params.n { + extras_map.insert("n".into(), Value::Number(n.into())); + } + if let Some(logit_bias) = typed_params.logit_bias { + extras_map.insert("logit_bias".into(), logit_bias); + } + if let Some(stream_options) = typed_params.stream_options { + extras_map.insert("stream_options".into(), stream_options); + } + if let Some(prediction) = typed_params.prediction { + extras_map.insert("prediction".into(), prediction); + } + if let Some(safety_identifier) = typed_params.safety_identifier { + extras_map.insert("safety_identifier".into(), Value::String(safety_identifier)); + } + if let Some(prompt_cache_key) = typed_params.prompt_cache_key { + extras_map.insert("prompt_cache_key".into(), Value::String(prompt_cache_key)); + } + + let mut provider_extras = HashMap::new(); + if !extras_map.is_empty() { + provider_extras.insert(ProviderFormat::OpenAI, extras_map); + } + Ok(UniversalRequest { - model: Some(request.model), + model: typed_params.model, messages, params, - extras, + provider_extras, }) } @@ -135,8 +186,11 @@ impl ProviderAdapter for OpenAIAdapter { reason: "missing model".to_string(), })?; - let openai_messages: Vec = - as TryFromLLM>>::try_from( + // Validate unsupported parameters + reject_params!(req, ProviderFormat::OpenAI, top_k); + + let openai_messages: Vec = + as TryFromLLM>>::try_from( req.messages.clone(), ) .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; @@ -153,19 +207,64 @@ impl ProviderAdapter for OpenAIAdapter { insert_opt_f64(&mut obj, "temperature", req.params.temperature); insert_opt_f64(&mut obj, "top_p", req.params.top_p); insert_opt_i64(&mut obj, "max_completion_tokens", req.params.max_tokens); - insert_opt_value(&mut obj, "stop", req.params.stop.clone()); - insert_opt_value(&mut obj, "tools", req.params.tools.clone()); - insert_opt_value(&mut obj, "tool_choice", req.params.tool_choice.clone()); + // Output stop sequences as array (OpenAI accepts both string and array) + if let Some(ref stop) = req.params.stop { + if !stop.is_empty() { + obj.insert( + "stop".into(), + Value::Array(stop.iter().map(|s| Value::String(s.clone())).collect()), + ); + } + } + // Convert tools to OpenAI Chat format + if let Some(tools) = &req.params.tools { + if let Some(tools_value) = tools_to_openai_chat_value(tools)? 
{ + obj.insert("tools".into(), tools_value); + } + } + // Use helper methods to reduce boilerplate + insert_opt_value( + &mut obj, + "tool_choice", + req.params.tool_choice_for(ProviderFormat::OpenAI), + ); insert_opt_value( &mut obj, "response_format", - req.params.response_format.clone(), + req.params.response_format_for(ProviderFormat::OpenAI), ); insert_opt_i64(&mut obj, "seed", req.params.seed); insert_opt_f64(&mut obj, "presence_penalty", req.params.presence_penalty); insert_opt_f64(&mut obj, "frequency_penalty", req.params.frequency_penalty); + insert_opt_bool(&mut obj, "logprobs", req.params.logprobs); + insert_opt_i64(&mut obj, "top_logprobs", req.params.top_logprobs); insert_opt_bool(&mut obj, "stream", req.params.stream); + // Add parallel_tool_calls from canonical params + if let Some(parallel) = req.params.parallel_tool_calls { + obj.insert("parallel_tool_calls".into(), Value::Bool(parallel)); + } + + // Add reasoning_effort from canonical params + if let Some(effort_value) = req.params.reasoning_for(ProviderFormat::OpenAI) { + obj.insert("reasoning_effort".into(), effort_value); + } + + // Add metadata from canonical params + if let Some(metadata) = req.params.metadata.as_ref() { + obj.insert("metadata".into(), metadata.clone()); + } + + // Add store from canonical params + if let Some(store) = req.params.store { + obj.insert("store".into(), Value::Bool(store)); + } + + // Add service_tier from canonical params + if let Some(ref service_tier) = req.params.service_tier { + obj.insert("service_tier".into(), Value::String(service_tier.clone())); + } + // If streaming, ensure stream_options.include_usage is set for usage reporting if req.params.stream == Some(true) { let stream_options = obj @@ -176,18 +275,16 @@ impl ProviderAdapter for OpenAIAdapter { } } - // Merge extras (provider-specific fields) - for (k, v) in &req.extras { - obj.insert(k.clone(), v.clone()); + // Merge back provider-specific extras (only for OpenAI) + if let Some(extras) = req.provider_extras.get(&ProviderFormat::OpenAI) { + for (k, v) in extras { + obj.insert(k.clone(), v.clone()); + } } Ok(Value::Object(obj)) } - fn apply_defaults(&self, _req: &mut UniversalRequest) { - // OpenAI doesn't require any specific defaults - } - fn detect_response(&self, payload: &Value) -> bool { // OpenAI chat completion response has choices[].message and object="chat.completion" payload.get("choices").and_then(Value::as_array).is_some() @@ -208,37 +305,31 @@ impl ProviderAdapter for OpenAIAdapter { for choice in choices { if let Some(msg_val) = choice.get("message") { - let response_msg: ChatCompletionResponseMessage = + // Deserialize to extended type to capture reasoning field + let response_msg: ChatCompletionResponseMessageExt = serde_json::from_value(msg_val.clone()) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let universal = >::try_from( - &response_msg, - ) - .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; + let universal = + >::try_from( + response_msg, + ) + .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; messages.push(universal); } // Get finish_reason from first choice if finish_reason.is_none() { if let Some(reason) = choice.get("finish_reason").and_then(Value::as_str) { - finish_reason = Some(reason.parse().unwrap()); + finish_reason = + Some(reason.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "FinishReason", + value: reason.to_string(), + })?); } } } - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: 
u.get("prompt_tokens").and_then(Value::as_i64), - completion_tokens: u.get("completion_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u - .get("prompt_tokens_details") - .and_then(|d| d.get("cached_tokens")) - .and_then(Value::as_i64), - prompt_cache_creation_tokens: None, // OpenAI doesn't report cache creation tokens - completion_reasoning_tokens: u - .get("completion_tokens_details") - .and_then(|d| d.get("reasoning_tokens")) - .and_then(Value::as_i64), - }); + let usage = UniversalUsage::extract_from_response(&payload, self.format()); Ok(UniversalResponse { model: payload @@ -252,8 +343,10 @@ impl ProviderAdapter for OpenAIAdapter { } fn response_from_universal(&self, resp: &UniversalResponse) -> Result { - let finish_reason = self - .map_finish_reason(resp.finish_reason.as_ref()) + let finish_reason = resp + .finish_reason + .as_ref() + .map(|r| r.to_provider_string(self.format()).to_string()) .unwrap_or_else(|| "stop".to_string()); let choices: Vec = resp @@ -261,8 +354,9 @@ impl ProviderAdapter for OpenAIAdapter { .iter() .enumerate() .map(|(i, msg)| { + // Use extended type to include reasoning field in output let response_msg = - >::try_from(msg) + >::try_from(msg) .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; let message_value = serde_json::to_value(&response_msg) @@ -276,15 +370,10 @@ impl ProviderAdapter for OpenAIAdapter { }) .collect::, TransformError>>()?; - let usage = resp.usage.as_ref().map(|u| { - let input = u.prompt_tokens.unwrap_or(0); - let output = u.completion_tokens.unwrap_or(0); - serde_json::json!({ - "prompt_tokens": input, - "completion_tokens": output, - "total_tokens": input + output - }) - }); + let usage = resp + .usage + .as_ref() + .map(|u| u.to_provider_value(self.format())); let mut obj = serde_json::json!({ "id": format!("chatcmpl-{}", PLACEHOLDER_ID), @@ -303,16 +392,6 @@ impl ProviderAdapter for OpenAIAdapter { Ok(obj) } - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option { - reason.map(|r| match r { - FinishReason::Stop => "stop".to_string(), - FinishReason::Length => "length".to_string(), - FinishReason::ToolCalls => "tool_calls".to_string(), - FinishReason::ContentFilter => "content_filter".to_string(), - FinishReason::Other(s) => s.clone(), - }) - } - // ========================================================================= // Streaming response handling // ========================================================================= @@ -364,19 +443,7 @@ impl ProviderAdapter for OpenAIAdapter { .unwrap_or_default(); // Extract usage if present (usually only on final chunk) - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("prompt_tokens").and_then(Value::as_i64), - completion_tokens: u.get("completion_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u - .get("prompt_tokens_details") - .and_then(|d| d.get("cached_tokens")) - .and_then(Value::as_i64), - prompt_cache_creation_tokens: None, - completion_reasoning_tokens: u - .get("completion_tokens_details") - .and_then(|d| d.get("reasoning_tokens")) - .and_then(Value::as_i64), - }); + let usage = UniversalUsage::extract_from_response(&payload, self.format()); Ok(Some(UniversalStreamChunk::new( payload.get("id").and_then(Value::as_str).map(String::from), @@ -439,15 +506,9 @@ impl ProviderAdapter for OpenAIAdapter { obj_map.insert("created".into(), Value::Number(created.into())); } if let Some(ref usage) = chunk.usage { - let prompt = usage.prompt_tokens.unwrap_or(0); - let completion = 
usage.completion_tokens.unwrap_or(0); obj_map.insert( "usage".into(), - serde_json::json!({ - "prompt_tokens": prompt, - "completion_tokens": completion, - "total_tokens": prompt + completion - }), + usage.to_provider_value(ProviderFormat::OpenAI), ); } @@ -455,660 +516,6 @@ impl ProviderAdapter for OpenAIAdapter { } } -/// Adapter for OpenAI Responses API (used by reasoning models like o1). -pub struct ResponsesAdapter; - -impl ProviderAdapter for ResponsesAdapter { - fn format(&self) -> ProviderFormat { - ProviderFormat::Responses - } - - fn directory_name(&self) -> &'static str { - "responses" - } - - fn display_name(&self) -> &'static str { - "Responses" - } - - fn detect_request(&self, payload: &Value) -> bool { - try_parse_responses(payload).is_ok() - } - - fn request_to_universal(&self, payload: Value) -> Result { - let extras = collect_extras(&payload, RESPONSES_KNOWN_KEYS); - let request: CreateResponseClass = serde_json::from_value(payload) - .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - - // Extract input items from the request - let input_items: Vec = match request.input { - Some(Instructions::InputItemArray(items)) => items, - Some(Instructions::String(s)) => { - // Single string input - create a user message InputItem - vec![InputItem { - input_item_type: Some(InputItemType::Message), - role: Some(InputItemRole::User), - content: Some(InputItemContent::String(s)), - ..Default::default() - }] - } - None => vec![], - }; - - let messages = as TryFromLLM>>::try_from(input_items) - .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - - let params = UniversalParams { - temperature: request.temperature, - top_p: request.top_p, - top_k: None, - max_tokens: request.max_output_tokens, - stop: None, // Responses API doesn't use stop - tools: request.tools.and_then(|t| serde_json::to_value(t).ok()), - tool_choice: request - .tool_choice - .and_then(|t| serde_json::to_value(t).ok()), - response_format: None, // Different structure in Responses API - seed: None, // Responses API uses different randomness control - presence_penalty: None, // Responses API doesn't support penalties - frequency_penalty: None, - stream: request.stream, - }; - - Ok(UniversalRequest { - model: request.model, // Already Option in CreateResponseClass - messages, - params, - extras, - }) - } - - fn request_from_universal(&self, req: &UniversalRequest) -> Result { - let model = req.model.as_ref().ok_or(TransformError::ValidationFailed { - target: ProviderFormat::Responses, - reason: "missing model".to_string(), - })?; - - // Use existing conversion with 1:N Tool message expansion - let input_items = universal_to_responses_input(&req.messages) - .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; - - let mut obj = Map::new(); - obj.insert("model".into(), Value::String(model.clone())); - obj.insert( - "input".into(), - serde_json::to_value(input_items) - .map_err(|e| TransformError::SerializationFailed(e.to_string()))?, - ); - - // Note: temperature is intentionally NOT included for Responses API - // as reasoning models (o1, o3) don't support it - insert_opt_f64(&mut obj, "top_p", req.params.top_p); - insert_opt_i64(&mut obj, "max_output_tokens", req.params.max_tokens); - insert_opt_f64(&mut obj, "presence_penalty", req.params.presence_penalty); - insert_opt_f64(&mut obj, "frequency_penalty", req.params.frequency_penalty); - insert_opt_bool(&mut obj, "stream", req.params.stream); - - // Transform tools from OpenAI Chat format to Responses API format - // {type: 
"function", function: {name, description, parameters}} - // → {type: "function", name, description, parameters, strict: false} - // Tools can come from params.tools or extras.tools depending on how the request was built - let tools_value = req - .params - .tools - .as_ref() - .or_else(|| req.extras.get("tools")); - if let Some(Value::Array(tools)) = tools_value { - let response_tools: Vec = tools - .iter() - .filter_map(|tool| { - if tool.get("type").and_then(Value::as_str) == Some("function") { - let func = tool.get("function")?; - Some(serde_json::json!({ - "type": "function", - "name": func.get("name")?, - "description": func.get("description"), - "parameters": func.get("parameters").cloned().unwrap_or(serde_json::json!({})), - "strict": false - })) - } else { - None - } - }) - .collect(); - if !response_tools.is_empty() { - obj.insert("tools".into(), Value::Array(response_tools)); - } - } - - // Transform tool_choice from OpenAI Chat format to Responses API format - // {function: {name: "foo"}} → {type: "function", name: "foo"} - // tool_choice can come from params or extras depending on how the request was built - let tool_choice_value = req - .params - .tool_choice - .as_ref() - .or_else(|| req.extras.get("tool_choice")); - if let Some(tool_choice) = tool_choice_value { - let converted = match tool_choice { - Value::String(s) if s == "none" || s == "auto" || s == "required" => { - Value::String(s.clone()) - } - Value::Object(obj_tc) if obj_tc.contains_key("function") => { - if let Some(func) = obj_tc.get("function") { - if let Some(name) = func.get("name").and_then(Value::as_str) { - serde_json::json!({ "type": "function", "name": name }) - } else { - Value::String("auto".into()) - } - } else { - Value::String("auto".into()) - } - } - _ => Value::String("auto".into()), - }; - obj.insert("tool_choice".into(), converted); - } - - // Transform response_format to nested text.format structure for Responses API - if let Some(response_format) = req.extras.get("response_format") { - let text_format = match response_format.get("type").and_then(Value::as_str) { - Some("text") | Some("json_object") => { - Some(serde_json::json!({ "format": response_format })) - } - Some("json_schema") => response_format.get("json_schema").map(|json_schema| { - serde_json::json!({ - "format": { - "type": "json_schema", - "schema": json_schema.get("schema").cloned().unwrap_or(serde_json::json!({})), - "name": json_schema.get("name"), - "description": json_schema.get("description"), - "strict": json_schema.get("strict") - } - }) - }), - _ => None, - }; - if let Some(tf) = text_format { - obj.insert("text".into(), tf); - } - } - - // Transform reasoning_effort to nested reasoning.effort structure - if let Some(effort) = req.extras.get("reasoning_effort") { - obj.insert( - "reasoning".into(), - serde_json::json!({ "effort": effort.clone() }), - ); - } - - // Pass through parallel_tool_calls - if let Some(Value::Bool(parallel)) = req.extras.get("parallel_tool_calls") { - obj.insert("parallel_tool_calls".into(), Value::Bool(*parallel)); - } - - // Merge remaining extras (except those we handled specially) - for (k, v) in &req.extras { - if !matches!( - k.as_str(), - "tools" - | "tool_choice" - | "response_format" - | "reasoning_effort" - | "parallel_tool_calls" - ) { - obj.insert(k.clone(), v.clone()); - } - } - - Ok(Value::Object(obj)) - } - - fn apply_defaults(&self, _req: &mut UniversalRequest) { - // Responses API doesn't require any specific defaults - } - - fn detect_response(&self, payload: &Value) -> bool { - 
// Responses API response has output[] array and object="response" - payload.get("output").and_then(Value::as_array).is_some() - && payload - .get("object") - .and_then(Value::as_str) - .is_some_and(|o| o == "response") - } - - fn response_to_universal(&self, payload: Value) -> Result { - let output = payload - .get("output") - .and_then(Value::as_array) - .ok_or_else(|| TransformError::ToUniversalFailed("missing output".to_string()))?; - - // Convert output items to messages - // Responses API has multiple output types: message, function_call, reasoning, etc. - let mut messages: Vec = Vec::new(); - let mut tool_calls: Vec = Vec::new(); - - for item in output { - let item_type = item.get("type").and_then(Value::as_str); - - match item_type { - Some("message") => { - // Message type - extract text content - if let Some(content) = item.get("content") { - if let Some(content_arr) = content.as_array() { - let text: String = content_arr - .iter() - .filter_map(|c| { - if c.get("type").and_then(Value::as_str) == Some("output_text") - { - c.get("text").and_then(Value::as_str).map(String::from) - } else { - None - } - }) - .collect::>() - .join(""); - if !text.is_empty() { - messages.push(Message::Assistant { - content: AssistantContent::String(text), - id: None, - }); - } - } - } - } - Some("function_call") => { - // Function call - collect for later conversion to tool calls - tool_calls.push(item.clone()); - } - _ => { - // Skip reasoning and other types for now - } - } - } - - // If we have tool calls but no messages, create an assistant message with tool calls - if !tool_calls.is_empty() && messages.is_empty() { - // Convert function_call items to tool call format - use crate::universal::message::{AssistantContentPart, ToolCallArguments}; - let parts: Vec = tool_calls - .iter() - .filter_map(|tc| { - let name = tc.get("name").and_then(Value::as_str)?; - let call_id = tc.get("call_id").and_then(Value::as_str)?; - let arguments = tc.get("arguments").and_then(Value::as_str)?; - - // Try to parse arguments as JSON, fall back to invalid string - let args = serde_json::from_str::>(arguments) - .map(ToolCallArguments::Valid) - .unwrap_or_else(|_| ToolCallArguments::Invalid(arguments.to_string())); - - Some(AssistantContentPart::ToolCall { - tool_call_id: call_id.to_string(), - tool_name: name.to_string(), - arguments: args, - provider_options: None, - provider_executed: None, - }) - }) - .collect(); - - if !parts.is_empty() { - messages.push(Message::Assistant { - content: AssistantContent::Array(parts), - id: None, - }); - } - } - - // If still no messages, try output_text field as fallback - if messages.is_empty() { - if let Some(text) = payload.get("output_text").and_then(Value::as_str) { - if !text.is_empty() { - messages.push(Message::Assistant { - content: AssistantContent::String(text.to_string()), - id: None, - }); - } - } - } - - // Map status to finish_reason - let finish_reason = payload - .get("status") - .and_then(Value::as_str) - .map(|s| s.parse().unwrap()); - - let usage = payload.get("usage").map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u - .get("input_tokens_details") - .and_then(|d| d.get("cached_tokens")) - .and_then(Value::as_i64), - prompt_cache_creation_tokens: None, - completion_reasoning_tokens: u - .get("output_tokens_details") - .and_then(|d| d.get("reasoning_tokens")) - .and_then(Value::as_i64), - }); - - Ok(UniversalResponse { - model: 
payload - .get("model") - .and_then(Value::as_str) - .map(String::from), - messages, - usage, - finish_reason, - }) - } - - fn response_from_universal(&self, resp: &UniversalResponse) -> Result { - // Build Responses API response format - let output: Vec = resp - .messages - .iter() - .map(|msg| { - let text = match msg { - Message::Assistant { content, .. } => match content { - AssistantContent::String(s) => s.clone(), - AssistantContent::Array(_) => String::new(), // TODO: extract text from parts - }, - Message::User { content } => match content { - UserContent::String(s) => s.clone(), - UserContent::Array(_) => String::new(), - }, - _ => String::new(), - }; - - serde_json::json!({ - "type": "message", - "role": "assistant", - "content": [{ - "type": "output_text", - "text": text - }] - }) - }) - .collect(); - - let status = self - .map_finish_reason(resp.finish_reason.as_ref()) - .unwrap_or_else(|| "completed".to_string()); - - // Build response with all required fields for TheResponseObject - let mut obj = serde_json::json!({ - "id": format!("resp_{}", PLACEHOLDER_ID), - "object": "response", - "model": resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), - "output": output, - "status": status, - "created_at": 0.0, - "tool_choice": "none", - "tools": [], - "parallel_tool_calls": false - }); - - if let Some(usage) = &resp.usage { - let input = usage.prompt_tokens.unwrap_or(0); - let output = usage.completion_tokens.unwrap_or(0); - obj.as_object_mut().unwrap().insert( - "usage".into(), - serde_json::json!({ - "input_tokens": input, - "output_tokens": output, - "total_tokens": input + output, - "input_tokens_details": { - "cached_tokens": usage.prompt_cached_tokens.unwrap_or(0) - }, - "output_tokens_details": { - "reasoning_tokens": usage.completion_reasoning_tokens.unwrap_or(0) - } - }), - ); - } - - Ok(obj) - } - - fn map_finish_reason(&self, reason: Option<&FinishReason>) -> Option { - reason.map(|r| match r { - FinishReason::Stop => "completed".to_string(), - FinishReason::Length => "incomplete".to_string(), - FinishReason::ToolCalls => "completed".to_string(), // Tool calls also complete - FinishReason::ContentFilter => "incomplete".to_string(), - FinishReason::Other(s) => s.clone(), - }) - } - - // ========================================================================= - // Streaming response handling - // ========================================================================= - - fn detect_stream_response(&self, payload: &Value) -> bool { - // Responses API streaming has type field starting with "response." 
- payload - .get("type") - .and_then(Value::as_str) - .is_some_and(|t| t.starts_with("response.")) - } - - fn stream_to_universal( - &self, - payload: Value, - ) -> Result, TransformError> { - let event_type = payload - .get("type") - .and_then(Value::as_str) - .ok_or_else(|| TransformError::ToUniversalFailed("missing type field".to_string()))?; - - match event_type { - "response.output_text.delta" => { - // Text delta - extract from delta field - let text = payload.get("delta").and_then(Value::as_str).unwrap_or(""); - let output_index = payload - .get("output_index") - .and_then(Value::as_u64) - .unwrap_or(0) as u32; - - Ok(Some(UniversalStreamChunk::new( - None, - None, - vec![UniversalStreamChoice { - index: output_index, - delta: Some(serde_json::json!({ - "role": "assistant", - "content": text - })), - finish_reason: None, - }], - None, - None, - ))) - } - - "response.completed" => { - // Final event with usage - let response = payload.get("response"); - let usage = response - .and_then(|r| r.get("usage")) - .map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u - .get("input_tokens_details") - .and_then(|d| d.get("cached_tokens")) - .and_then(Value::as_i64), - prompt_cache_creation_tokens: None, - completion_reasoning_tokens: u - .get("output_tokens_details") - .and_then(|d| d.get("reasoning_tokens")) - .and_then(Value::as_i64), - }); - - let model = response - .and_then(|r| r.get("model")) - .and_then(Value::as_str) - .map(String::from); - - let id = response - .and_then(|r| r.get("id")) - .and_then(Value::as_str) - .map(String::from); - - Ok(Some(UniversalStreamChunk::new( - id, - model, - vec![UniversalStreamChoice { - index: 0, - delta: Some(serde_json::json!({})), - finish_reason: Some("stop".to_string()), - }], - None, - usage, - ))) - } - - "response.incomplete" => { - // Incomplete response - typically due to length - let response = payload.get("response"); - let usage = response - .and_then(|r| r.get("usage")) - .map(|u| UniversalUsage { - prompt_tokens: u.get("input_tokens").and_then(Value::as_i64), - completion_tokens: u.get("output_tokens").and_then(Value::as_i64), - prompt_cached_tokens: u - .get("input_tokens_details") - .and_then(|d| d.get("cached_tokens")) - .and_then(Value::as_i64), - prompt_cache_creation_tokens: None, - completion_reasoning_tokens: u - .get("output_tokens_details") - .and_then(|d| d.get("reasoning_tokens")) - .and_then(Value::as_i64), - }); - - Ok(Some(UniversalStreamChunk::new( - None, - None, - vec![UniversalStreamChoice { - index: 0, - delta: Some(serde_json::json!({})), - finish_reason: Some("length".to_string()), - }], - None, - usage, - ))) - } - - "response.created" | "response.in_progress" => { - // Initial metadata events - extract model/id - let response = payload.get("response"); - let model = response - .and_then(|r| r.get("model")) - .and_then(Value::as_str) - .map(String::from); - let id = response - .and_then(|r| r.get("id")) - .and_then(Value::as_str) - .map(String::from); - - Ok(Some(UniversalStreamChunk::new( - id, - model, - vec![UniversalStreamChoice { - index: 0, - delta: Some(serde_json::json!({"role": "assistant", "content": ""})), - finish_reason: None, - }], - None, - None, - ))) - } - - // All other events are metadata/keep-alive - _ => Ok(Some(UniversalStreamChunk::keep_alive())), - } - } - - fn stream_from_universal(&self, chunk: &UniversalStreamChunk) -> Result { - if chunk.is_keep_alive() { 
- // Return a generic in_progress event - return Ok(serde_json::json!({ - "type": "response.in_progress", - "sequence_number": 0 - })); - } - - // Check for finish chunk - let has_finish = chunk - .choices - .first() - .and_then(|c| c.finish_reason.as_ref()) - .is_some(); - - if has_finish { - let finish_reason = chunk.choices.first().and_then(|c| c.finish_reason.as_ref()); - let status = match finish_reason.map(|r| r.as_str()) { - Some("stop") => "completed", - Some("length") => "incomplete", - _ => "completed", - }; - - let id = chunk - .id - .clone() - .unwrap_or_else(|| format!("resp_{}", PLACEHOLDER_ID)); - let mut response = serde_json::json!({ - "id": id, - "object": "response", - "model": chunk.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), - "status": status, - "output": [] - }); - - if let Some(usage) = &chunk.usage { - response.as_object_mut().unwrap().insert( - "usage".into(), - serde_json::json!({ - "input_tokens": usage.prompt_tokens.unwrap_or(0), - "output_tokens": usage.completion_tokens.unwrap_or(0), - "total_tokens": usage.prompt_tokens.unwrap_or(0) + usage.completion_tokens.unwrap_or(0) - }), - ); - } - - return Ok(serde_json::json!({ - "type": if status == "completed" { "response.completed" } else { "response.incomplete" }, - "response": response - })); - } - - // Check for content delta - if let Some(choice) = chunk.choices.first() { - if let Some(delta) = &choice.delta { - if let Some(content) = delta.get("content").and_then(Value::as_str) { - return Ok(serde_json::json!({ - "type": "response.output_text.delta", - "output_index": choice.index, - "content_index": 0, - "delta": content - })); - } - } - } - - // Fallback - return output_text.delta with empty content - Ok(serde_json::json!({ - "type": "response.output_text.delta", - "output_index": 0, - "content_index": 0, - "delta": "" - })) - } -} - // ============================================================================= // OpenAI Target-Specific Transformations // ============================================================================= @@ -1418,8 +825,12 @@ mod tests { }); let universal = adapter.request_to_universal(payload).unwrap(); - assert!(universal.extras.contains_key("user")); - assert!(universal.extras.contains_key("custom_field")); + let openai_extras = universal + .provider_extras + .get(&ProviderFormat::OpenAI) + .expect("should have OpenAI extras"); + assert!(openai_extras.contains_key("user")); + assert!(openai_extras.contains_key("custom_field")); let reconstructed = adapter.request_from_universal(&universal).unwrap(); assert_eq!(reconstructed.get("user").unwrap(), "test-user-123"); @@ -1430,12 +841,218 @@ mod tests { } #[test] - fn test_responses_detect_request() { - let adapter = ResponsesAdapter; - let payload = json!({ - "model": "o1", - "input": [{"role": "user", "content": "Hello"}] - }); - assert!(adapter.detect_request(&payload)); + fn test_openai_reasoning_roundtrip() { + use crate::universal::message::{AssistantContent, AssistantContentPart, TextContentPart}; + + let adapter = OpenAIAdapter; + + // Create universal request with reasoning content + let universal = UniversalRequest { + model: Some("gpt-4".to_string()), + messages: vec![ + Message::User { + content: crate::universal::message::UserContent::String("Hello".to_string()), + }, + Message::Assistant { + content: AssistantContent::Array(vec![ + AssistantContentPart::Reasoning { + text: "Let me think about this...".to_string(), + encrypted_content: None, + }, + AssistantContentPart::Text(TextContentPart { + text: 
"OK".to_string(), + provider_options: None, + }), + ]), + id: None, + }, + Message::User { + content: crate::universal::message::UserContent::String("Thanks".to_string()), + }, + ], + params: Default::default(), + provider_extras: Default::default(), + }; + + // Convert universal to ChatCompletions format + let openai_json = adapter.request_from_universal(&universal).unwrap(); + + // Verify reasoning field is in the JSON output + let messages = openai_json.get("messages").unwrap().as_array().unwrap(); + let assistant_msg = &messages[1]; + eprintln!( + "Assistant message JSON: {}", + serde_json::to_string_pretty(assistant_msg).unwrap() + ); + + assert!( + assistant_msg.get("reasoning").is_some(), + "Assistant message should have reasoning field. Got: {}", + serde_json::to_string_pretty(assistant_msg).unwrap() + ); + assert_eq!( + assistant_msg.get("reasoning").unwrap().as_str().unwrap(), + "Let me think about this..." + ); + + // Now convert back to universal and verify reasoning is preserved + let universal2 = adapter.request_to_universal(openai_json.clone()).unwrap(); + + // Check that reasoning is preserved in universal format + let msg = &universal2.messages[1]; + match msg { + Message::Assistant { content, .. } => match content { + AssistantContent::Array(parts) => { + let reasoning_part = parts + .iter() + .find(|p| matches!(p, AssistantContentPart::Reasoning { .. })); + assert!( + reasoning_part.is_some(), + "Should have reasoning part after roundtrip. Got: {:?}", + parts + ); + } + _ => panic!("Expected Array content, got {:?}", content), + }, + _ => panic!("Expected Assistant message, got {:?}", msg), + } + } + + #[test] + fn test_openai_reasoning_only_roundtrip() { + // Test case like Responses API where assistant message only has reasoning, no text + use crate::universal::message::{AssistantContent, AssistantContentPart}; + + let adapter = OpenAIAdapter; + + // Create universal request with reasoning-only content (like from Responses API) + let universal = UniversalRequest { + model: Some("gpt-4".to_string()), + messages: vec![ + Message::User { + content: crate::universal::message::UserContent::String("Hello".to_string()), + }, + Message::Assistant { + content: AssistantContent::Array(vec![AssistantContentPart::Reasoning { + text: "Let me think...".to_string(), + encrypted_content: None, + }]), + id: None, + }, + ], + params: Default::default(), + provider_extras: Default::default(), + }; + + // Convert universal to ChatCompletions format + let openai_json = adapter.request_from_universal(&universal).unwrap(); + eprintln!( + "Full OpenAI JSON: {}", + serde_json::to_string_pretty(&openai_json).unwrap() + ); + + // Verify reasoning field is in the JSON output + let messages = openai_json.get("messages").unwrap().as_array().unwrap(); + let assistant_msg = &messages[1]; + eprintln!( + "Assistant message JSON: {}", + serde_json::to_string_pretty(assistant_msg).unwrap() + ); + + assert!( + assistant_msg.get("reasoning").is_some(), + "Assistant message should have reasoning field. Got: {}", + serde_json::to_string_pretty(assistant_msg).unwrap() + ); + + // Now convert back to universal and verify reasoning is preserved + let universal2 = adapter.request_to_universal(openai_json.clone()).unwrap(); + eprintln!("Universal2 messages: {:?}", universal2.messages); + + // Check that reasoning is preserved in universal format + let msg = &universal2.messages[1]; + match msg { + Message::Assistant { content, .. 
} => match content { + AssistantContent::Array(parts) => { + eprintln!("Parts: {:?}", parts); + let reasoning_part = parts + .iter() + .find(|p| matches!(p, AssistantContentPart::Reasoning { .. })); + assert!( + reasoning_part.is_some(), + "Should have reasoning part after roundtrip. Got: {:?}", + parts + ); + } + AssistantContent::String(s) => { + panic!("Expected Array content, got String: {:?}", s) + } + }, + _ => panic!("Expected Assistant message, got {:?}", msg), + } + } + + #[test] + fn test_openai_empty_reasoning_roundtrip() { + // Test case like Responses API where assistant message has empty reasoning summary + use crate::universal::message::{AssistantContent, AssistantContentPart}; + + let adapter = OpenAIAdapter; + + // Create universal request with empty reasoning content (like from Responses API with empty summary) + let universal = UniversalRequest { + model: Some("gpt-4".to_string()), + messages: vec![ + Message::User { + content: crate::universal::message::UserContent::String("Hello".to_string()), + }, + Message::Assistant { + content: AssistantContent::Array(vec![AssistantContentPart::Reasoning { + text: "".to_string(), // Empty reasoning + encrypted_content: None, + }]), + id: None, + }, + ], + params: Default::default(), + provider_extras: Default::default(), + }; + + // Convert universal to ChatCompletions format + let openai_json = adapter.request_from_universal(&universal).unwrap(); + + // Verify reasoning field is in the JSON output (even if empty) + let messages = openai_json.get("messages").unwrap().as_array().unwrap(); + let assistant_msg = &messages[1]; + + assert!( + assistant_msg.get("reasoning").is_some(), + "Assistant message should have reasoning field (even if empty). Got: {}", + serde_json::to_string_pretty(assistant_msg).unwrap() + ); + + // Now convert back to universal and verify reasoning is preserved + let universal2 = adapter.request_to_universal(openai_json.clone()).unwrap(); + + // Check that empty reasoning is preserved in universal format + let msg = &universal2.messages[1]; + match msg { + Message::Assistant { content, .. } => match content { + AssistantContent::Array(parts) => { + let reasoning_part = parts + .iter() + .find(|p| matches!(p, AssistantContentPart::Reasoning { .. })); + assert!( + reasoning_part.is_some(), + "Should have reasoning part after roundtrip (even if empty). Got: {:?}", + parts + ); + } + AssistantContent::String(s) => { + panic!("Expected Array content, got String: {:?}", s) + } + }, + _ => panic!("Expected Assistant message, got {:?}", msg), + } } } diff --git a/crates/lingua/src/providers/openai/convert.rs b/crates/lingua/src/providers/openai/convert.rs index a4d6936d..bf8a5303 100644 --- a/crates/lingua/src/providers/openai/convert.rs +++ b/crates/lingua/src/providers/openai/convert.rs @@ -7,6 +7,38 @@ use crate::universal::{ AssistantContent, AssistantContentPart, Message, TextContentPart, ToolCallArguments, ToolContentPart, ToolResultContentPart, UserContent, UserContentPart, }; +use crate::util::media::parse_base64_data_url; +use serde::{Deserialize, Serialize}; + +/// Extended ChatCompletionRequest/ResponseMessage with reasoning support. +/// +/// The official OpenAI Chat Completions API doesn't include a `reasoning` field on messages.` +/// With the release of gpt-oss, OpenAI's guidance is to handle reasoning content with +/// a top-level `reasoning` field. 
https://cookbook.openai.com/articles/gpt-oss/handle-raw-cot#chat-completions-api +/// +/// These extension type uses `#[serde(flatten)]` to wrap the generated type while adding +/// the `reasoning` field, keeping generated types faithful to the official spec. +#[derive(Debug, Clone, Serialize, Deserialize)] +pub struct ChatCompletionResponseMessageExt { + #[serde(flatten)] + pub base: openai::ChatCompletionResponseMessage, + #[serde(skip_serializing_if = "Option::is_none")] + pub reasoning: Option, + /// Encrypted reasoning signature for cross-provider roundtrips (e.g., Anthropic's signature) + #[serde(skip_serializing_if = "Option::is_none")] + pub reasoning_signature: Option, +} + +#[derive(Debug, Clone, Serialize, Deserialize)] +pub struct ChatCompletionRequestMessageExt { + #[serde(flatten)] + pub base: openai::ChatCompletionRequestMessage, + #[serde(skip_serializing_if = "Option::is_none")] + pub reasoning: Option, + /// Encrypted reasoning signature for cross-provider roundtrips (e.g., Anthropic's signature) + #[serde(skip_serializing_if = "Option::is_none")] + pub reasoning_signature: Option, +} /// Helper function to build ToolCallArguments from a JSON value fn build_tool_arguments(value: &serde_json::Value) -> ToolCallArguments { @@ -16,6 +48,27 @@ fn build_tool_arguments(value: &serde_json::Value) -> ToolCallArguments { } } +/// Helper to parse an optional field from JSON with proper error handling. +/// +/// Returns `Ok(None)` if the field is missing or null, `Ok(Some(value))` if parsing succeeds, +/// or `Err` with a descriptive error if parsing fails. +fn parse_builtin_field( + value: &serde_json::Value, + field: &str, + tool_name: &str, +) -> Result, ConvertError> { + match value.get(field) { + Some(v) if v.is_null() => Ok(None), + Some(v) => serde_json::from_value(v.clone()).map(Some).map_err(|e| { + ConvertError::JsonSerializationFailed { + field: format!("{}.{}", tool_name, field), + error: e.to_string(), + } + }), + None => Ok(None), + } +} + /// Convert OpenAI InputItem collection to universal Message collection /// This handles OpenAI-specific logic for combining or transforming multiple items impl TryFromLLM> for Vec { @@ -356,9 +409,19 @@ impl TryFromLLM for UserContentPart { None }; + // Parse data URLs to extract raw base64, keep HTTP URLs as-is + let (image_data, media_type) = + if let Some(block) = parse_base64_data_url(&image_url) { + // Data URL: extract raw base64 and media type + (block.data, Some(block.media_type)) + } else { + // HTTP URL or other: keep as-is with default media type + (image_url.clone(), Some("image/jpeg".to_string())) + }; + UserContentPart::Image { - image: serde_json::Value::String(image_url), - media_type: Some("image/jpeg".to_string()), // Default to JPEG, could be improved + image: serde_json::Value::String(image_data), + media_type, provider_options, } } @@ -438,10 +501,10 @@ impl TryFromLLM for openai::InputContent { }, UserContentPart::Image { image, + media_type, provider_options, - .. 
} => { - let image_url = match image { + let image_str = match image { serde_json::Value::String(url) => url, _ => { return Err(ConvertError::UnsupportedInputType { @@ -450,6 +513,18 @@ impl TryFromLLM for openai::InputContent { } }; + // If we have raw base64 data (not a URL) and media_type, create a proper data URL + let image_url = if !image_str.starts_with("data:") + && !image_str.starts_with("http://") + && !image_str.starts_with("https://") + { + // Assume raw base64 data - create data URL with media_type + let mt = media_type.as_deref().unwrap_or("image/jpeg"); + format!("data:{};base64,{}", mt, image_str) + } else { + image_str + }; + // Extract detail from provider_options if present let detail = provider_options .as_ref() @@ -559,6 +634,37 @@ impl TryFromLLM for openai::InputContent { ..Default::default() } } + AssistantContentPart::ToolResult { + tool_call_id: _, + tool_name, + output, + .. + } => { + // Check for web search tool result marker from Anthropic + let is_web_search = tool_name == "web_search" + || output.get("anthropic_type").and_then(|v| v.as_str()) + == Some("web_search_tool_result"); + + if is_web_search { + // Convert web search results to text representation for InputContent + // Extract search results content for display + let text = serde_json::to_string(&output).unwrap_or_else(|_| "{}".to_string()); + openai::InputContent { + input_content_type: openai::InputItemContentListType::OutputText, + text: Some(text), + annotations: Some(vec![]), + logprobs: Some(vec![]), + ..Default::default() + } + } else { + return Err(ConvertError::UnsupportedInputType { + type_info: format!( + "AssistantContentPart::ToolResult for tool: {}", + tool_name + ), + }); + } + } _ => { return Err(ConvertError::UnsupportedInputType { type_info: format!("AssistantContentPart variant: {:?}", part), @@ -782,12 +888,16 @@ impl TryFromLLM for openai::InputItem { "web_search" => ( openai::InputItemType::WebSearchCall, openai::InputItem { - action: args_value.get("action").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), - queries: args_value.get("queries").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + action: parse_builtin_field( + &args_value, + "action", + "web_search", + )?, + queries: parse_builtin_field( + &args_value, + "queries", + "web_search", + )?, ..Default::default() }, ), @@ -802,30 +912,38 @@ impl TryFromLLM for openai::InputItem { .get("container_id") .and_then(|v| v.as_str()) .map(|s| s.to_string()), - outputs: args_value.get("outputs").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + outputs: parse_builtin_field( + &args_value, + "outputs", + "code_interpreter", + )?, ..Default::default() }, ), "file_search" => ( openai::InputItemType::FileSearchCall, openai::InputItem { - queries: args_value.get("queries").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), - results: args_value.get("results").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + queries: parse_builtin_field( + &args_value, + "queries", + "file_search", + )?, + results: parse_builtin_field( + &args_value, + "results", + "file_search", + )?, ..Default::default() }, ), "computer" => ( openai::InputItemType::ComputerCall, openai::InputItem { - action: args_value.get("action").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + action: parse_builtin_field( + &args_value, + "action", + "computer", + )?, ..Default::default() }, ), @@ -842,9 +960,11 @@ impl TryFromLLM for openai::InputItem { "local_shell" => ( 
openai::InputItemType::LocalShellCall, openai::InputItem { - action: args_value.get("action").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + action: parse_builtin_field( + &args_value, + "action", + "local_shell", + )?, ..Default::default() }, ), @@ -865,9 +985,11 @@ impl TryFromLLM for openai::InputItem { .get("server_label") .and_then(|v| v.as_str()) .map(|s| s.to_string()), - tools: args_value.get("tools").and_then(|v| { - serde_json::from_value(v.clone()).ok() - }), + tools: parse_builtin_field( + &args_value, + "tools", + "mcp_list_tools", + )?, ..Default::default() }, ), @@ -976,12 +1098,176 @@ impl TryFromLLM for openai::InputItem { } } +/// Create an InputItem for a function call (regular or built-in tool). +/// +/// This helper extracts the logic for converting a universal tool call to an OpenAI InputItem, +/// handling both provider-executed built-in tools and regular function calls. +fn create_function_call_input_item( + call_id: &str, + name: &str, + arguments: &ToolCallArguments, + provider_executed: Option, + id: Option, +) -> Result { + // Check if this is a provider-executed built-in tool + if provider_executed == Some(true) { + // Convert back to the appropriate built-in tool type based on tool_name + let args_value = match &arguments { + ToolCallArguments::Valid(map) => serde_json::Value::Object(map.clone()), + ToolCallArguments::Invalid(s) => serde_json::Value::String(s.clone()), + }; + + let (input_item_type, mut item) = match name { + "web_search" => ( + openai::InputItemType::WebSearchCall, + openai::InputItem { + action: args_value + .get("action") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + queries: args_value + .get("queries") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "code_interpreter" => ( + openai::InputItemType::CodeInterpreterCall, + openai::InputItem { + code: args_value + .get("code") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + container_id: args_value + .get("container_id") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + outputs: args_value + .get("outputs") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "file_search" => ( + openai::InputItemType::FileSearchCall, + openai::InputItem { + queries: args_value + .get("queries") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + results: args_value + .get("results") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "computer" => ( + openai::InputItemType::ComputerCall, + openai::InputItem { + action: args_value + .get("action") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "image_generation" => ( + openai::InputItemType::ImageGenerationCall, + openai::InputItem { + result: args_value + .get("result") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + ..Default::default() + }, + ), + "local_shell" => ( + openai::InputItemType::LocalShellCall, + openai::InputItem { + action: args_value + .get("action") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "mcp_call" => ( + openai::InputItemType::McpCall, + openai::InputItem { + server_label: args_value + .get("server_label") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + ..Default::default() + }, + ), + "mcp_list_tools" => ( + openai::InputItemType::McpListTools, + openai::InputItem { + server_label: args_value + .get("server_label") + .and_then(|v| v.as_str()) + 
.map(|s| s.to_string()), + tools: args_value + .get("tools") + .and_then(|v| serde_json::from_value(v.clone()).ok()), + ..Default::default() + }, + ), + "mcp_approval_request" => ( + openai::InputItemType::McpApprovalRequest, + openai::InputItem { + ..Default::default() + }, + ), + _ => { + // Unknown provider-executed tool - fall back to FunctionCall + return Ok(openai::InputItem { + role: None, + content: None, + input_item_type: Some(openai::InputItemType::FunctionCall), + id, + call_id: Some(call_id.to_string()), + name: Some(name.to_string()), + arguments: Some(arguments.to_string()), + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + }; + + // Set common fields + item.id = id; + item.input_item_type = Some(input_item_type); + item.status = args_value + .get("status") + .and_then(|v| serde_json::from_value(v.clone()).ok()); + + Ok(item) + } else { + // Regular function call (not provider-executed) + Ok(openai::InputItem { + role: None, // Preserve original role state - request context function calls don't have roles + content: None, + input_item_type: Some(openai::InputItemType::FunctionCall), + id, + call_id: Some(call_id.to_string()), + name: Some(name.to_string()), + arguments: Some(arguments.to_string()), + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }) + } +} + /// Convert universal messages to OpenAI Responses API InputItem format. /// /// This function handles the 1:N expansion for Tool messages - a single Tool message /// can contain multiple tool results, and each result becomes a separate InputItem /// (which is required by the Responses API). /// +/// It also handles 1:N expansion for Assistant messages with mixed content (reasoning, +/// text, and tool calls). Each content type becomes a separate InputItem in order: +/// 1. Reasoning item (if reasoning parts exist) +/// 2. Message item (if text/normal parts exist) +/// 3. Function call items (one per tool call) +/// /// This is provided as a standalone function rather than a TryFromLLM impl because /// Rust's coherence rules don't allow overriding the blanket Vec implementation. 
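+///
+/// A rough sketch of the expansion (names here are illustrative, not part of the API):
+///
+/// ```ignore
+/// // One assistant message holding reasoning, text, and a tool call comes back as
+/// // three InputItems, in that order: reasoning, message, function_call.
+/// let items = universal_to_responses_input(&request.messages)?;
+/// ```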
pub fn universal_to_responses_input( @@ -1018,6 +1304,102 @@ pub fn universal_to_responses_input( } } } + Message::Assistant { content, id } => { + // Handle assistant messages with potential 1:N expansion for mixed content + match content { + AssistantContent::String(text) => { + // Simple case: single message item + result.push(openai::InputItem { + role: Some(openai::InputItemRole::Assistant), + content: Some(openai::InputItemContent::String(text.clone())), + id: id.clone(), + input_item_type: Some(openai::InputItemType::Message), + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + AssistantContent::Array(parts) => { + // Categorize all parts into separate collections + let mut reasoning_parts: Vec = vec![]; + let mut encrypted_content = None; + let mut normal_parts: Vec = vec![]; + let mut tool_calls: Vec<(String, String, ToolCallArguments, Option)> = + vec![]; + + for part in parts { + match part { + AssistantContentPart::Reasoning { + text, + encrypted_content: ec, + } => { + encrypted_content = ec.clone(); + if !text.is_empty() { + reasoning_parts.push(openai::SummaryText { + text: text.clone(), + summary_text_type: openai::SummaryType::SummaryText, + }); + } + } + AssistantContentPart::ToolCall { + tool_call_id, + tool_name, + arguments, + provider_options: _, + provider_executed, + } => { + tool_calls.push(( + tool_call_id.clone(), + tool_name.clone(), + arguments.clone(), + *provider_executed, + )); + } + other_part => { + normal_parts.push(TryFromLLM::try_from(other_part.clone())?); + } + } + } + + // 1. Emit reasoning item if present + if !reasoning_parts.is_empty() || encrypted_content.is_some() { + result.push(openai::InputItem { + role: None, + content: None, + input_item_type: Some(openai::InputItemType::Reasoning), + id: id.clone(), + summary: Some(reasoning_parts), + encrypted_content: encrypted_content.clone(), + ..Default::default() + }); + } + + // 2. Emit message item if normal parts present + if !normal_parts.is_empty() { + result.push(openai::InputItem { + role: Some(openai::InputItemRole::Assistant), + content: Some(openai::InputItemContent::InputContentArray( + normal_parts, + )), + input_item_type: Some(openai::InputItemType::Message), + id: None, // id was used for reasoning if present + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + + // 3. 
Emit function call items (one per tool call) + for (call_id, name, arguments, provider_executed) in tool_calls { + result.push(create_function_call_input_item( + &call_id, + &name, + &arguments, + provider_executed, + id.clone(), + )?); + } + } + } + } other => { // For all other message types, use the standard conversion result.push(>::try_from( @@ -1402,14 +1784,14 @@ fn convert_output_message_content_to_input_content( // Chat Completion Conversions // ============================================================================ -/// Convert ChatCompletionRequestMessage to universal Message -impl TryFromLLM for Message { +/// Convert ChatCompletionRequestMessageExt to universal Message +impl TryFromLLM for Message { type Error = ConvertError; - fn try_from(msg: openai::ChatCompletionRequestMessage) -> Result { - match msg.role { + fn try_from(msg: ChatCompletionRequestMessageExt) -> Result { + match msg.base.role { openai::ChatCompletionRequestMessageRole::System => { - let content = match msg.content { + let content = match msg.base.content { Some(openai::ChatCompletionRequestMessageContent::String(text)) => { UserContent::String(text) } @@ -1425,7 +1807,7 @@ impl TryFromLLM for Message { Ok(Message::System { content }) } openai::ChatCompletionRequestMessageRole::User => { - let content = match msg.content { + let content = match msg.base.content { Some(openai::ChatCompletionRequestMessageContent::String(text)) => { UserContent::String(text) } @@ -1443,8 +1825,18 @@ impl TryFromLLM for Message { openai::ChatCompletionRequestMessageRole::Assistant => { let mut content_parts: Vec = Vec::new(); + // Add reasoning FIRST if present (natural model output order) + // Note: We preserve empty reasoning strings because the presence of the + // reasoning field indicates reasoning occurred (content may be hidden/summarized) + if let Some(reasoning) = msg.reasoning { + content_parts.push(AssistantContentPart::Reasoning { + text: reasoning, + encrypted_content: msg.reasoning_signature.clone(), + }); + } + // Add text content if present - match msg.content { + match msg.base.content { Some(openai::ChatCompletionRequestMessageContent::String(text)) => { if !text.is_empty() { content_parts.push(AssistantContentPart::Text(TextContentPart { @@ -1481,7 +1873,7 @@ impl TryFromLLM for Message { } // Add tool calls if present - if let Some(tool_calls) = msg.tool_calls { + if let Some(tool_calls) = msg.base.tool_calls { for tool_call in tool_calls { if let Some(function) = tool_call.function { content_parts.push(AssistantContentPart::ToolCall { @@ -1513,7 +1905,7 @@ impl TryFromLLM for Message { } openai::ChatCompletionRequestMessageRole::Developer => { // Treat developer messages as system messages in universal format - let content = match msg.content { + let content = match msg.base.content { Some(openai::ChatCompletionRequestMessageContent::String(text)) => { UserContent::String(text) } @@ -1530,7 +1922,7 @@ impl TryFromLLM for Message { } openai::ChatCompletionRequestMessageRole::Tool => { // Tool messages should extract tool_call_id and content - let content_text = match msg.content { + let content_text = match msg.base.content { Some(openai::ChatCompletionRequestMessageContent::String(text)) => text, Some(openai::ChatCompletionRequestMessageContent::ChatCompletionRequestMessageContentPartArray(mut arr)) => { if arr.len() != 1 { @@ -1551,7 +1943,8 @@ impl TryFromLLM for Message { }; let tool_call_id = - msg.tool_call_id + msg.base + .tool_call_id .ok_or_else(|| ConvertError::MissingRequiredField { field: 
"tool_call_id".to_string(), })?; @@ -1568,8 +1961,9 @@ impl TryFromLLM for Message { content: vec![ToolContentPart::ToolResult(tool_result)], }) } - _ => Err(ConvertError::InvalidRole { - role: format!("{:?}", msg.role), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "role", + value: format!("{:?}", msg.base.role), }), } } @@ -1597,15 +1991,19 @@ impl TryFromLLM for UserContent } openai::PurpleType::ImageUrl => { if let Some(image_url) = part.image_url { - // Convert ImageUrl to UserContentPart::Image + // Parse data URLs to extract raw base64, keep HTTP URLs as-is + let (image_data, media_type) = + if let Some(block) = parse_base64_data_url(&image_url.url) { + // Data URL: extract raw base64 and media type + (block.data, Some(block.media_type)) + } else { + // HTTP URL or other: keep as-is, no media type + (image_url.url.clone(), None) + }; + Ok(UserContentPart::Image { - image: serde_json::to_value(&image_url.url).map_err(|e| { - ConvertError::JsonSerializationFailed { - field: "image_url".to_string(), - error: e.to_string(), - } - })?, - media_type: Some("image/url".to_string()), + image: serde_json::Value::String(image_data), + media_type, provider_options: None, }) } else { @@ -1625,43 +2023,56 @@ impl TryFromLLM for UserContent } /// Convert universal Message to ChatCompletionRequestMessage -impl TryFromLLM for openai::ChatCompletionRequestMessage { +impl TryFromLLM for ChatCompletionRequestMessageExt { type Error = ConvertError; fn try_from(msg: Message) -> Result { match msg { - Message::System { content } => Ok(openai::ChatCompletionRequestMessage { - role: openai::ChatCompletionRequestMessageRole::System, - content: Some(convert_user_content_to_chat_completion_content(content)?), - name: None, - tool_calls: None, - tool_call_id: None, - audio: None, - function_call: None, - refusal: None, - }), - Message::User { content } => Ok(openai::ChatCompletionRequestMessage { - role: openai::ChatCompletionRequestMessageRole::User, - content: Some(convert_user_content_to_chat_completion_content(content)?), - name: None, - tool_calls: None, - tool_call_id: None, - audio: None, - function_call: None, - refusal: None, + Message::System { content } => Ok(ChatCompletionRequestMessageExt { + base: openai::ChatCompletionRequestMessage { + role: openai::ChatCompletionRequestMessageRole::System, + content: Some(convert_user_content_to_chat_completion_content(content)?), + name: None, + tool_calls: None, + tool_call_id: None, + audio: None, + function_call: None, + refusal: None, + }, + reasoning: None, + reasoning_signature: None, }), - Message::Assistant { content, id: _ } => { - let (text_content, tool_calls) = extract_content_and_tool_calls(content)?; - - Ok(openai::ChatCompletionRequestMessage { - role: openai::ChatCompletionRequestMessageRole::Assistant, - content: text_content, + Message::User { content } => Ok(ChatCompletionRequestMessageExt { + base: openai::ChatCompletionRequestMessage { + role: openai::ChatCompletionRequestMessageRole::User, + content: Some(convert_user_content_to_chat_completion_content(content)?), name: None, - tool_calls, + tool_calls: None, tool_call_id: None, audio: None, function_call: None, refusal: None, + }, + reasoning: None, + reasoning_signature: None, + }), + Message::Assistant { content, id: _ } => { + let (text_content, tool_calls, reasoning, reasoning_signature) = + extract_content_tool_calls_and_reasoning(content)?; + + Ok(ChatCompletionRequestMessageExt { + base: openai::ChatCompletionRequestMessage { + role: 
openai::ChatCompletionRequestMessageRole::Assistant, + content: text_content, + name: None, + tool_calls, + tool_call_id: None, + audio: None, + function_call: None, + refusal: None, + }, + reasoning, + reasoning_signature, }) } Message::Tool { content } => { @@ -1688,17 +2099,21 @@ impl TryFromLLM for openai::ChatCompletionRequestMessage { })?, }; - Ok(openai::ChatCompletionRequestMessage { - role: openai::ChatCompletionRequestMessageRole::Tool, - content: Some(openai::ChatCompletionRequestMessageContent::String( - content_string, - )), - name: None, - tool_calls: None, - tool_call_id: Some(tool_result.tool_call_id.clone()), - audio: None, - function_call: None, - refusal: None, + Ok(ChatCompletionRequestMessageExt { + base: openai::ChatCompletionRequestMessage { + role: openai::ChatCompletionRequestMessageRole::Tool, + content: Some(openai::ChatCompletionRequestMessageContent::String( + content_string, + )), + name: None, + tool_calls: None, + tool_call_id: Some(tool_result.tool_call_id.clone()), + audio: None, + function_call: None, + refusal: None, + }, + reasoning: None, + reasoning_signature: None, }) } } @@ -1736,11 +2151,11 @@ fn convert_user_content_part_to_chat_completion_part( }), UserContentPart::Image { image, - media_type: _, + media_type, provider_options: _, } => { // Convert image to ImageUrl format - let url = match image { + let image_str = match image { serde_json::Value::String(url) => url, _ => { return Err(ConvertError::UnsupportedInputType { @@ -1751,6 +2166,19 @@ fn convert_user_content_part_to_chat_completion_part( }) } }; + + // If we have raw base64 data (not a URL) and media_type, create a proper data URL + let url = if !image_str.starts_with("data:") + && !image_str.starts_with("http://") + && !image_str.starts_with("https://") + { + // Assume raw base64 data - create data URL with media_type + let mt = media_type.as_deref().unwrap_or("image/jpeg"); + format!("data:{};base64,{}", mt, image_str) + } else { + image_str + }; + Ok(openai::ChatCompletionRequestMessageContentPart { text: None, chat_completion_request_message_content_part_type: openai::PurpleType::ImageUrl, @@ -1769,24 +2197,29 @@ fn convert_user_content_part_to_chat_completion_part( } } -/// Extract text content and tool calls from AssistantContent -fn extract_content_and_tool_calls( +type ExtractedContentResult = ( + Option, + Option>, + Option, + Option, // reasoning_signature +); + +/// Extract text content, tool calls, reasoning, and reasoning_signature from AssistantContent +fn extract_content_tool_calls_and_reasoning( content: AssistantContent, -) -> Result< - ( - Option, - Option>, - ), - ConvertError, -> { +) -> Result { let mut text_parts = Vec::new(); let mut tool_calls = Vec::new(); + let mut reasoning_parts = Vec::new(); + let mut reasoning_signature: Option = None; match content { AssistantContent::String(text) => { return Ok(( Some(openai::ChatCompletionRequestMessageContent::String(text)), None, + None, + None, )); } AssistantContent::Array(parts) => { @@ -1795,6 +2228,16 @@ fn extract_content_and_tool_calls( AssistantContentPart::Text(text_part) => { text_parts.push(text_part.text); } + AssistantContentPart::Reasoning { + text, + encrypted_content, + } => { + reasoning_parts.push(text); + // Take the first signature if multiple reasoning blocks exist + if reasoning_signature.is_none() { + reasoning_signature = encrypted_content; + } + } AssistantContentPart::ToolCall { tool_call_id, tool_name, @@ -1833,20 +2276,41 @@ fn extract_content_and_tool_calls( Some(tool_calls) }; - 
Ok((text_content, tool_calls_option)) + let reasoning = if reasoning_parts.is_empty() { + None + } else { + Some(reasoning_parts.join("")) + }; + + Ok(( + text_content, + tool_calls_option, + reasoning, + reasoning_signature, + )) } -/// Convert ChatCompletionResponseMessage to universal Message -impl TryFromLLM<&openai::ChatCompletionResponseMessage> for Message { +/// Convert ChatCompletionResponseMessageExt to universal Message +impl TryFromLLM for Message { type Error = ConvertError; - fn try_from(msg: &openai::ChatCompletionResponseMessage) -> Result { - match msg.role { + fn try_from(msg: ChatCompletionResponseMessageExt) -> Result { + match msg.base.role { openai::MessageRole::Assistant => { let mut content_parts: Vec = Vec::new(); + // Add reasoning FIRST if present (natural model output order: think first, respond after) + // Note: We preserve empty reasoning strings because the presence of the + // reasoning field indicates reasoning occurred (content may be hidden/summarized) + if let Some(reasoning) = msg.reasoning { + content_parts.push(AssistantContentPart::Reasoning { + text: reasoning, + encrypted_content: msg.reasoning_signature.clone(), + }); + } + // Add text content if present - if let Some(text) = &msg.content { + if let Some(text) = &msg.base.content { if !text.is_empty() { content_parts.push(AssistantContentPart::Text(TextContentPart { text: text.clone(), @@ -1856,7 +2320,7 @@ impl TryFromLLM<&openai::ChatCompletionResponseMessage> for Message { } // Add tool calls if present - if let Some(tool_calls) = &msg.tool_calls { + if let Some(tool_calls) = &msg.base.tool_calls { for tool_call in tool_calls { if let Some(function) = &tool_call.function { content_parts.push(AssistantContentPart::ToolCall { @@ -1890,15 +2354,15 @@ impl TryFromLLM<&openai::ChatCompletionResponseMessage> for Message { } } -/// Convert universal Message to ChatCompletionResponseMessage -impl TryFromLLM<&Message> for openai::ChatCompletionResponseMessage { +/// Convert universal Message to ChatCompletionResponseMessageExt +impl TryFromLLM<&Message> for ChatCompletionResponseMessageExt { type Error = ConvertError; fn try_from(msg: &Message) -> Result { match msg { Message::Assistant { content, id: _ } => { - let (content_text, tool_calls) = match content { - AssistantContent::String(text) => (Some(text.clone()), None), + let (content_text, tool_calls, reasoning, reasoning_signature) = match content { + AssistantContent::String(text) => (Some(text.clone()), None, None, None), AssistantContent::Array(parts) => { // Extract text from parts and concatenate let texts: Vec = parts @@ -1911,6 +2375,23 @@ impl TryFromLLM<&Message> for openai::ChatCompletionResponseMessage { }) .collect(); + // Extract reasoning from parts and concatenate, also capture signature + let mut reasonings: Vec = Vec::new(); + let mut signature: Option = None; + for part in parts { + if let AssistantContentPart::Reasoning { + text, + encrypted_content, + } = part + { + reasonings.push(text.clone()); + // Take the first signature if multiple reasoning blocks exist + if signature.is_none() { + signature = encrypted_content.clone(); + } + } + } + // Extract tool calls from parts let tool_calls: Vec = parts .iter() @@ -1939,28 +2420,39 @@ impl TryFromLLM<&Message> for openai::ChatCompletionResponseMessage { Some(texts.join("")) }; + let reasoning = if reasonings.is_empty() { + None + } else { + Some(reasonings.join("")) + }; + let tool_calls_option = if tool_calls.is_empty() { None } else { Some(tool_calls) }; - (content_text, 
tool_calls_option) + (content_text, tool_calls_option, reasoning, signature) } }; - Ok(openai::ChatCompletionResponseMessage { - role: openai::MessageRole::Assistant, - content: content_text, - annotations: Some(vec![]), // Hardcode empty annotations for consistency - audio: None, - function_call: None, - refusal: None, - tool_calls, + Ok(ChatCompletionResponseMessageExt { + base: openai::ChatCompletionResponseMessage { + role: openai::MessageRole::Assistant, + content: content_text, + annotations: Some(vec![]), // Hardcode empty annotations for consistency + audio: None, + function_call: None, + refusal: None, + tool_calls, + }, + reasoning, + reasoning_signature, }) } - _ => Err(ConvertError::InvalidRole { - role: format!("{:?}", msg), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "role", + value: format!("{:?}", msg), }), } } diff --git a/crates/lingua/src/providers/openai/mod.rs b/crates/lingua/src/providers/openai/mod.rs index 9ba962b6..00ede8e4 100644 --- a/crates/lingua/src/providers/openai/mod.rs +++ b/crates/lingua/src/providers/openai/mod.rs @@ -11,9 +11,12 @@ pub mod capabilities; pub mod convert; pub mod detect; pub mod generated; +pub mod params; +pub mod responses_adapter; // Re-export adapters and transformations -pub use adapter::{apply_target_transforms, OpenAIAdapter, OpenAITransformError, ResponsesAdapter}; +pub use adapter::{apply_target_transforms, OpenAIAdapter, OpenAITransformError}; +pub use responses_adapter::ResponsesAdapter; #[cfg(test)] pub mod test_responses; @@ -24,8 +27,10 @@ pub mod test_chat_completions; // Re-export detection functions pub use detect::{try_parse_openai, try_parse_responses, DetectionError}; -// Re-export conversion functions -pub use convert::universal_to_responses_input; +// Re-export conversion functions and extension types +pub use convert::{ + universal_to_responses_input, ChatCompletionRequestMessageExt, ChatCompletionResponseMessageExt, +}; // Re-export generated types (official OpenAI API types from OpenAPI spec) pub use generated::{ diff --git a/crates/lingua/src/providers/openai/params.rs b/crates/lingua/src/providers/openai/params.rs new file mode 100644 index 00000000..bb7e85ed --- /dev/null +++ b/crates/lingua/src/providers/openai/params.rs @@ -0,0 +1,198 @@ +/*! +Typed parameter structs for OpenAI APIs. + +These structs use `#[serde(flatten)]` to automatically capture unknown fields, +eliminating the need for explicit KNOWN_KEYS arrays. +*/ + +use crate::providers::openai::generated::{ + ChatCompletionRequestMessage, Instructions, Reasoning, ReasoningEffort, +}; +use crate::serde_json::Value; +use serde::{Deserialize, Serialize}; +use std::collections::BTreeMap; + +/// OpenAI Chat Completions API request parameters. +/// +/// All known fields are explicitly typed. Unknown fields automatically +/// go into `extras` via `#[serde(flatten)]`. 
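+///
+/// A minimal sketch of that behavior (it mirrors the
+/// `test_chat_params_unknown_fields_go_to_extras` test below; values are illustrative):
+///
+/// ```ignore
+/// let params: OpenAIChatParams = serde_json::from_value(json!({
+///     "model": "gpt-4o",
+///     "messages": [],
+///     "some_future_param": "value" // not a known field
+/// }))?;
+/// assert_eq!(params.model.as_deref(), Some("gpt-4o"));
+/// assert!(params.extras.contains_key("some_future_param"));
+/// ```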
+#[derive(Debug, Clone, Default, Serialize, Deserialize)] +pub struct OpenAIChatParams { + // === Core fields === + pub model: Option, + pub messages: Option>, + + // === Sampling parameters === + pub temperature: Option, + pub top_p: Option, + pub seed: Option, + pub presence_penalty: Option, + pub frequency_penalty: Option, + + // === Output control === + pub max_tokens: Option, + pub max_completion_tokens: Option, + pub stop: Option, + pub n: Option, + pub logprobs: Option, + pub top_logprobs: Option, + pub logit_bias: Option, + + // === Tools and function calling === + pub tools: Option, + pub tool_choice: Option, + pub parallel_tool_calls: Option, + + // === Response format === + pub response_format: Option, + + // === Streaming === + pub stream: Option, + pub stream_options: Option, + + // === Reasoning (o-series models) === + pub reasoning_effort: Option, + + // === Metadata and identification === + pub metadata: Option, + pub store: Option, + pub service_tier: Option, + pub user: Option, + pub safety_identifier: Option, + pub prompt_cache_key: Option, + + // === Prediction === + pub prediction: Option, + + /// Unknown fields - automatically captured by serde flatten. + /// These are provider-specific fields not in the canonical set. + #[serde(flatten)] + pub extras: BTreeMap, +} + +/// OpenAI Responses API request parameters. +/// +/// The Responses API has different field names and structure than Chat Completions. +/// All known fields are explicitly typed. Unknown fields automatically +/// go into `extras` via `#[serde(flatten)]`. +#[derive(Debug, Clone, Default, Serialize, Deserialize)] +pub struct OpenAIResponsesParams { + // === Core fields === + pub model: Option, + pub input: Option, + pub instructions: Option, + + // === Sampling parameters === + pub temperature: Option, + pub top_p: Option, + + // === Output control === + pub max_output_tokens: Option, + pub top_logprobs: Option, + + // === Tools and function calling === + pub tools: Option, + pub tool_choice: Option, + pub parallel_tool_calls: Option, + + // === Text/Response format (nested structure) === + pub text: Option, + + // === Streaming === + pub stream: Option, + + // === Reasoning configuration (nested structure) === + pub reasoning: Option, + + // === Context management === + pub truncation: Option, + + // === Metadata and identification === + pub metadata: Option, + pub store: Option, + pub service_tier: Option, + pub user: Option, + pub safety_identifier: Option, + pub prompt_cache_key: Option, + + /// Unknown fields - automatically captured by serde flatten. 
+ #[serde(flatten)] + pub extras: BTreeMap, +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json; + use crate::serde_json::json; + + #[test] + fn test_chat_params_known_fields() { + let json = json!({ + "model": "gpt-4o", + "messages": [{"role": "user", "content": "Hello"}], + "temperature": 0.7, + "max_tokens": 100 + }); + + let params: OpenAIChatParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.model, Some("gpt-4o".to_string())); + assert_eq!(params.temperature, Some(0.7)); + assert_eq!(params.max_tokens, Some(100)); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_chat_params_unknown_fields_go_to_extras() { + let json = json!({ + "model": "gpt-4o", + "messages": [], + "some_future_param": "value", + "another_unknown": 42 + }); + + let params: OpenAIChatParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.model, Some("gpt-4o".to_string())); + assert_eq!(params.extras.len(), 2); + assert_eq!( + params.extras.get("some_future_param"), + Some(&Value::String("value".to_string())) + ); + assert_eq!( + params.extras.get("another_unknown"), + Some(&Value::Number(42.into())) + ); + } + + #[test] + fn test_responses_params_known_fields() { + let json = json!({ + "model": "gpt-5-nano", + "input": [{"role": "user", "content": "Hello"}], + "instructions": "Be helpful", + "max_output_tokens": 500, + "reasoning": {"effort": "medium"} + }); + + let params: OpenAIResponsesParams = serde_json::from_value(json).unwrap(); + assert_eq!(params.model, Some("gpt-5-nano".to_string())); + assert_eq!(params.instructions, Some("Be helpful".to_string())); + assert_eq!(params.max_output_tokens, Some(500)); + assert!(params.extras.is_empty()); + } + + #[test] + fn test_roundtrip_preserves_extras() { + let json = json!({ + "model": "gpt-4o", + "messages": [], + "custom_field": {"nested": "data"} + }); + + let params: OpenAIChatParams = serde_json::from_value(json.clone()).unwrap(); + let back: Value = serde_json::to_value(¶ms).unwrap(); + + // Custom field should be preserved + assert_eq!(back.get("custom_field"), json.get("custom_field")); + } +} diff --git a/crates/lingua/src/providers/openai/responses_adapter.rs b/crates/lingua/src/providers/openai/responses_adapter.rs new file mode 100644 index 00000000..f6adca93 --- /dev/null +++ b/crates/lingua/src/providers/openai/responses_adapter.rs @@ -0,0 +1,848 @@ +/*! +OpenAI Responses API adapter. + +This module provides the `ResponsesAdapter` for the Responses API, +which is used by reasoning models like o1 and o3. 
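+
+Unlike Chat Completions, a Responses request carries its conversation in an `input`
+array (plus an optional top-level `instructions` string) rather than `messages`.
+A minimal request this adapter detects looks roughly like the following sketch
+(illustrative only):
+
+```ignore
+let payload = serde_json::json!({
+    "model": "o1",
+    "input": [{"role": "user", "content": "Hello"}]
+});
+assert!(ResponsesAdapter.detect_request(&payload));
+```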
+*/ + +use crate::capabilities::ProviderFormat; +use crate::reject_params; +use std::collections::HashMap; + +use crate::error::ConvertError; +use crate::processing::adapters::{ + insert_opt_bool, insert_opt_f64, insert_opt_i64, ProviderAdapter, +}; +use crate::processing::transform::TransformError; +use crate::providers::openai::generated::{ + InputItem, InputItemContent, InputItemRole, InputItemType, Instructions, OutputItemType, +}; +use crate::providers::openai::params::OpenAIResponsesParams; +use crate::providers::openai::{try_parse_responses, universal_to_responses_input}; +use crate::serde_json::{self, Map, Value}; +use crate::universal::convert::TryFromLLM; +use crate::universal::message::{ + AssistantContent, Message, TextContentPart, UserContent, UserContentPart, +}; +use crate::universal::tools::{tools_to_responses_value, UniversalTool}; +use crate::universal::{ + FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, + UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, +}; +use std::convert::TryInto; + +/// Check if a model is a reasoning model that doesn't support temperature. +fn is_reasoning_model(model: &str) -> bool { + let model_lower = model.to_lowercase(); + model_lower.starts_with("o1") + || model_lower.starts_with("o3") + || model_lower.starts_with("gpt-5") +} + +fn system_text(message: &Message) -> Option<&str> { + match message { + Message::System { content } => match content { + UserContent::String(text) => Some(text.as_str()), + UserContent::Array(parts) => { + if parts.len() != 1 { + return None; + } + match &parts[0] { + UserContentPart::Text(TextContentPart { text, .. }) => Some(text.as_str()), + _ => None, + } + } + }, + _ => None, + } +} + +/// Adapter for OpenAI Responses API (used by reasoning models like o1). 
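+///
+/// A rough usage sketch (error handling elided; `payload` stands in for any incoming
+/// Responses-format request body):
+///
+/// ```ignore
+/// let adapter = ResponsesAdapter;
+/// let universal = adapter.request_to_universal(payload)?;    // provider JSON -> UniversalRequest
+/// let rebuilt = adapter.request_from_universal(&universal)?; // UniversalRequest -> provider JSON
+/// ```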
+pub struct ResponsesAdapter; + +impl ProviderAdapter for ResponsesAdapter { + fn format(&self) -> ProviderFormat { + ProviderFormat::Responses + } + + fn directory_name(&self) -> &'static str { + "responses" + } + + fn display_name(&self) -> &'static str { + "Responses" + } + + fn detect_request(&self, payload: &Value) -> bool { + try_parse_responses(payload).is_ok() + } + + fn request_to_universal(&self, payload: Value) -> Result { + // Single parse: typed params now includes typed input via #[serde(flatten)] + let typed_params: OpenAIResponsesParams = serde_json::from_value(payload) + .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; + + // Extract input items from typed_params.input (partial move - other fields remain accessible) + let input_items: Vec = match typed_params.input { + Some(Instructions::InputItemArray(items)) => items, + Some(Instructions::String(s)) => { + // Single string input - create a user message InputItem + vec![InputItem { + input_item_type: Some(InputItemType::Message), + role: Some(InputItemRole::User), + content: Some(InputItemContent::String(s)), + ..Default::default() + }] + } + None => { + return Err(TransformError::ToUniversalFailed( + "OpenAI Responses: missing 'input' field".to_string(), + )) + } + }; + + let mut messages = as TryFromLLM>>::try_from(input_items) + .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; + + if let Some(instructions) = typed_params.instructions.as_ref().filter(|s| !s.is_empty()) { + messages.insert( + 0, + Message::System { + content: UserContent::String(instructions.clone()), + }, + ); + } + + // Extract response_format from nested text.format structure and convert to typed config + let response_format = typed_params + .text + .as_ref() + .and_then(|t| t.get("format")) + .and_then(|v| (ProviderFormat::Responses, v).try_into().ok()); + + // Extract max_tokens first - needed for reasoning budget computation + let max_tokens = typed_params.max_output_tokens; + + // Convert reasoning to ReasoningConfig, computing budget_tokens with max_tokens context + let reasoning = typed_params + .reasoning + .as_ref() + .map(|r| (r, max_tokens).into()); + + let mut params = UniversalParams { + temperature: typed_params.temperature, + top_p: typed_params.top_p, + top_k: None, + max_tokens, + stop: None, // Responses API doesn't use stop + tools: typed_params + .tools + .as_ref() + .map(UniversalTool::from_value_array), + tool_choice: typed_params + .tool_choice + .as_ref() + .and_then(|v| (ProviderFormat::Responses, v).try_into().ok()), + response_format, + seed: None, // Responses API uses different randomness control + presence_penalty: None, // Responses API doesn't support penalties + frequency_penalty: None, + stream: typed_params.stream, + // New canonical fields + parallel_tool_calls: typed_params.parallel_tool_calls, + reasoning, + metadata: typed_params.metadata, + store: typed_params.store, + service_tier: typed_params.service_tier, + logprobs: None, // Responses API doesn't support logprobs boolean + top_logprobs: typed_params.top_logprobs, + }; + + // Sync parallel_tool_calls with tool_choice.disable_parallel for roundtrip fidelity + // OpenAI uses parallel_tool_calls at params level, Anthropic uses tool_choice.disable_parallel + if params.parallel_tool_calls == Some(false) { + if let Some(ref mut tc) = params.tool_choice { + if tc.disable_parallel.is_none() { + tc.disable_parallel = Some(true); + } + } + } + + // Collect provider-specific extras for round-trip preservation + // This includes both 
unknown fields (from serde flatten) and known Responses API fields + // that aren't part of UniversalParams + let mut extras_map: Map = typed_params.extras.into_iter().collect(); + + // Add Responses API specific known fields that aren't in UniversalParams + if let Some(instructions) = typed_params.instructions { + extras_map.insert("instructions".into(), Value::String(instructions)); + } + if let Some(text) = typed_params.text { + extras_map.insert("text".into(), text); + } + if let Some(truncation) = typed_params.truncation { + extras_map.insert("truncation".into(), truncation); + } + if let Some(user) = typed_params.user { + extras_map.insert("user".into(), Value::String(user)); + } + if let Some(safety_identifier) = typed_params.safety_identifier { + extras_map.insert("safety_identifier".into(), Value::String(safety_identifier)); + } + if let Some(prompt_cache_key) = typed_params.prompt_cache_key { + extras_map.insert("prompt_cache_key".into(), Value::String(prompt_cache_key)); + } + + let mut provider_extras = HashMap::new(); + if !extras_map.is_empty() { + provider_extras.insert(ProviderFormat::Responses, extras_map); + } + + Ok(UniversalRequest { + model: typed_params.model, + messages, + params, + provider_extras, + }) + } + + fn request_from_universal(&self, req: &UniversalRequest) -> Result { + let model = req.model.as_ref().ok_or(TransformError::ValidationFailed { + target: ProviderFormat::Responses, + reason: "missing model".to_string(), + })?; + + // Validate unsupported parameters + reject_params!(req, ProviderFormat::Responses, top_k); + // Stop sequences need special handling (check if non-empty) + if req + .params + .stop + .as_ref() + .is_some_and(|stop| !stop.is_empty()) + { + return Err(TransformError::ValidationFailed { + target: ProviderFormat::Responses, + reason: "does not support stop sequences".to_string(), + }); + } + + let responses_extras = req.provider_extras.get(&ProviderFormat::Responses); + let mut messages_for_input = req.messages.clone(); + if let Some(extras) = responses_extras { + if let Some(instructions) = extras.get("instructions").and_then(Value::as_str) { + if let Some(first_text) = messages_for_input.first().and_then(system_text) { + if first_text == instructions { + messages_for_input.remove(0); + } + } + } + } + + // Use existing conversion with 1:N Tool message expansion + let input_items = universal_to_responses_input(&messages_for_input) + .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; + + let mut obj = Map::new(); + obj.insert("model".into(), Value::String(model.clone())); + obj.insert( + "input".into(), + serde_json::to_value(input_items) + .map_err(|e| TransformError::SerializationFailed(e.to_string()))?, + ); + + // Pass temperature through for non-reasoning models + // Reasoning models (o1-*, o3-*, gpt-5-*) don't support temperature + if !is_reasoning_model(model) { + insert_opt_f64(&mut obj, "temperature", req.params.temperature); + } + insert_opt_f64(&mut obj, "top_p", req.params.top_p); + insert_opt_i64(&mut obj, "max_output_tokens", req.params.max_tokens); + insert_opt_i64(&mut obj, "top_logprobs", req.params.top_logprobs); + // Note: presence_penalty, frequency_penalty, seed, logprobs (bool) are NOT supported by Responses API + insert_opt_bool(&mut obj, "stream", req.params.stream); + + // Get provider-specific extras for Responses API + let responses_extras = req.provider_extras.get(&ProviderFormat::Responses); + + // Convert tools to Responses API format + if let Some(tools) = req.params.tools.as_ref() { + if 
let Some(tools_value) = tools_to_responses_value(tools)? { + obj.insert("tools".into(), tools_value); + } + } + + // Convert tool_choice using helper method + if let Some(tool_choice_val) = req.params.tool_choice_for(ProviderFormat::Responses) { + obj.insert("tool_choice".into(), tool_choice_val); + } + + // Convert response_format to Responses API text format using helper method + if let Some(text_val) = req.params.response_format_for(ProviderFormat::Responses) { + obj.insert("text".into(), text_val); + } + + // Add reasoning from canonical params + if let Some(reasoning_val) = req.params.reasoning_for(ProviderFormat::Responses) { + obj.insert("reasoning".into(), reasoning_val); + } + + // Add parallel_tool_calls from canonical params + if let Some(parallel) = req.params.parallel_tool_calls { + obj.insert("parallel_tool_calls".into(), Value::Bool(parallel)); + } + + // Add metadata from canonical params + if let Some(metadata) = req.params.metadata.as_ref() { + obj.insert("metadata".into(), metadata.clone()); + } + + // Add store from canonical params + if let Some(store) = req.params.store { + obj.insert("store".into(), Value::Bool(store)); + } + + // Add service_tier from canonical params + if let Some(ref service_tier) = req.params.service_tier { + obj.insert("service_tier".into(), Value::String(service_tier.clone())); + } + + // Merge back provider-specific extras (only for Responses API) + if let Some(extras) = responses_extras { + for (k, v) in extras { + // Don't overwrite canonical fields we already handled + if !obj.contains_key(k) { + obj.insert(k.clone(), v.clone()); + } + } + } + + Ok(Value::Object(obj)) + } + + fn detect_response(&self, payload: &Value) -> bool { + // Responses API response has output[] array and object="response" + payload.get("output").and_then(Value::as_array).is_some() + && payload + .get("object") + .and_then(Value::as_str) + .is_some_and(|o| o == "response") + } + + fn response_to_universal(&self, payload: Value) -> Result { + let output = payload + .get("output") + .and_then(Value::as_array) + .ok_or_else(|| TransformError::ToUniversalFailed("missing output".to_string()))?; + + // Convert output items to messages + // Responses API has multiple output types: message, function_call, reasoning, etc. 
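+ // Illustrative sketch of the output array walked below (shape abbreviated):
+ //   [{"type": "message", "content": [{"type": "output_text", "text": "..."}]},
+ //    {"type": "function_call", "name": "...", "call_id": "...", "arguments": "{...}"}]
+ // "message" items contribute assistant text; "function_call" items become tool
+ // calls; other item types (e.g. "reasoning") are skipped here.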
+ let mut messages: Vec = Vec::new(); + let mut tool_calls: Vec = Vec::new(); + + for item in output { + let item_type = item.get("type").and_then(Value::as_str); + + match item_type { + Some("message") => { + // Message type - extract text content + if let Some(content) = item.get("content") { + if let Some(content_arr) = content.as_array() { + let text: String = content_arr + .iter() + .filter_map(|c| { + if c.get("type").and_then(Value::as_str) == Some("output_text") + { + c.get("text").and_then(Value::as_str).map(String::from) + } else { + None + } + }) + .collect::>() + .join(""); + if !text.is_empty() { + messages.push(Message::Assistant { + content: AssistantContent::String(text), + id: None, + }); + } + } + } + } + Some("function_call") => { + // Function call - collect for later conversion to tool calls + tool_calls.push(item.clone()); + } + _ => { + // Skip reasoning and other types for now + } + } + } + + // If we have tool calls but no messages, create an assistant message with tool calls + if !tool_calls.is_empty() && messages.is_empty() { + // Convert function_call items to tool call format + use crate::universal::message::{AssistantContentPart, ToolCallArguments}; + let parts: Vec = tool_calls + .iter() + .filter_map(|tc| { + let name = tc.get("name").and_then(Value::as_str)?; + let call_id = tc.get("call_id").and_then(Value::as_str)?; + let arguments = tc.get("arguments").and_then(Value::as_str)?; + + // Try to parse arguments as JSON, fall back to invalid string + let args = serde_json::from_str::>(arguments) + .map(ToolCallArguments::Valid) + .unwrap_or_else(|_| ToolCallArguments::Invalid(arguments.to_string())); + + Some(AssistantContentPart::ToolCall { + tool_call_id: call_id.to_string(), + tool_name: name.to_string(), + arguments: args, + provider_options: None, + provider_executed: None, + }) + }) + .collect(); + + if !parts.is_empty() { + messages.push(Message::Assistant { + content: AssistantContent::Array(parts), + id: None, + }); + } + } + + // If still no messages, try output_text field as fallback + // Include empty string to preserve message structure from source + if messages.is_empty() { + if let Some(text) = payload.get("output_text").and_then(Value::as_str) { + messages.push(Message::Assistant { + content: AssistantContent::String(text.to_string()), + id: None, + }); + } + } + + // Map status to finish_reason + // If we have tool calls, the finish reason should be ToolCalls regardless of status + let finish_reason = if !tool_calls.is_empty() { + Some(FinishReason::ToolCalls) + } else { + match payload.get("status").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "FinishReason", + value: s.to_string(), + })?), + None => None, + } + }; + + let usage = UniversalUsage::extract_from_response(&payload, self.format()); + + Ok(UniversalResponse { + model: payload + .get("model") + .and_then(Value::as_str) + .map(String::from), + messages, + usage, + finish_reason, + }) + } + + fn response_from_universal(&self, resp: &UniversalResponse) -> Result { + // Convert messages to InputItems (handles 1:N expansion for mixed content) + let input_items = universal_to_responses_input(&resp.messages) + .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; + + // Convert InputItems to OutputItems using existing infrastructure + let output_items: Vec = input_items + .into_iter() + .map(TryFromLLM::try_from) + .collect::>() + .map_err(|e: ConvertError| TransformError::FromUniversalFailed(e.to_string()))?; 
+ + // Serialize OutputItems to JSON values + let output: Vec = output_items + .iter() + .map(serde_json::to_value) + .collect::>() + .map_err(|e| { + TransformError::SerializationFailed(format!( + "Failed to serialize output item: {}", + e + )) + })?; + + // Calculate output_text (concatenate text from all message-type items) + let output_text = output_items + .iter() + .filter(|item| item.output_item_type == Some(OutputItemType::Message)) + .filter_map(|item| item.content.as_ref()) + .flat_map(|content| content.iter()) + .filter_map(|c| c.text.as_ref()) + .cloned() + .collect::>() + .join(""); + + let status = resp + .finish_reason + .as_ref() + .map(|r| r.to_provider_string(self.format()).to_string()) + .unwrap_or_else(|| "completed".to_string()); + + // Build response with all required fields for TheResponseObject + let mut obj = serde_json::json!({ + "id": format!("resp_{}", PLACEHOLDER_ID), + "object": "response", + "model": resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), + "output": output, + "output_text": output_text, + "status": status, + "created_at": 0.0, + "tool_choice": "none", + "tools": [], + "parallel_tool_calls": false + }); + + if let Some(usage) = &resp.usage { + obj.as_object_mut() + .unwrap() + .insert("usage".into(), usage.to_provider_value(self.format())); + } + + Ok(obj) + } + + // ========================================================================= + // Streaming response handling + // ========================================================================= + + fn detect_stream_response(&self, payload: &Value) -> bool { + // Responses API streaming has two formats: + // 1. type field starting with "response." at top level + // 2. object="response.delta" at top level with delta.type nested + payload + .get("type") + .and_then(Value::as_str) + .is_some_and(|t| t.starts_with("response.")) + || payload + .get("object") + .and_then(Value::as_str) + .is_some_and(|o| o == "response.delta") + } + + fn stream_to_universal( + &self, + payload: Value, + ) -> Result, TransformError> { + // Handle two streaming formats: + // 1. Standard: type field at top level (e.g., "response.created") + // 2. 
Alternate: object="response.delta" with delta.type nested (e.g., delta.type="response.start") + let event_type = if let Some(t) = payload.get("type").and_then(Value::as_str) { + t.to_string() + } else if payload.get("object").and_then(Value::as_str) == Some("response.delta") { + // Alternate format - get type from delta + let delta_type = payload + .get("delta") + .and_then(|d| d.get("type")) + .and_then(Value::as_str) + .unwrap_or("unknown"); + // Map alternate type names to standard ones + match delta_type { + "response.start" => "response.created".to_string(), + "response.done" => "response.completed".to_string(), + "content_part.delta" => "response.output_text.delta".to_string(), + "content_part.start" | "content_part.done" | "output_item.start" + | "output_item.done" => { + return Ok(Some(UniversalStreamChunk::keep_alive())); + } + other => format!("response.{}", other), + } + } else { + return Err(TransformError::ToUniversalFailed( + "missing type field".to_string(), + )); + }; + + // For alternate format, extract data from delta instead of top level + let is_alternate_format = + payload.get("object").and_then(Value::as_str) == Some("response.delta"); + let delta_obj = payload.get("delta"); + + match event_type.as_str() { + "response.output_text.delta" => { + // Text delta - extract from delta field + // Standard format: payload.delta is the text string + // Alternate format: payload.delta.text is the text string + let text = if is_alternate_format { + delta_obj + .and_then(|d| d.get("text")) + .and_then(Value::as_str) + } else { + payload.get("delta").and_then(Value::as_str) + }; + + // Use null for empty/missing text, preserving semantic equivalence with source + let content_value = match text { + Some(t) if !t.is_empty() => Value::String(t.to_string()), + _ => Value::Null, // Empty or missing text becomes null + }; + + let output_index = payload + .get("output_index") + .or_else(|| delta_obj.and_then(|d| d.get("index"))) + .and_then(Value::as_u64) + .unwrap_or(0) as u32; + + Ok(Some(UniversalStreamChunk::new( + None, + None, + vec![UniversalStreamChoice { + index: output_index, + delta: Some(serde_json::json!({ + "role": "assistant", + "content": content_value + })), + finish_reason: None, + }], + None, + None, + ))) + } + + "response.completed" => { + // Final event with usage + let response = payload.get("response"); + let usage = response + .and_then(|r| r.get("usage")) + .map(|u| UniversalUsage::from_provider_value(u, self.format())); + + let model = response + .and_then(|r| r.get("model")) + .and_then(Value::as_str) + .map(String::from); + + let id = response + .and_then(|r| r.get("id")) + .and_then(Value::as_str) + .map(String::from); + + Ok(Some(UniversalStreamChunk::new( + id, + model, + vec![UniversalStreamChoice { + index: 0, + delta: Some(serde_json::json!({})), + finish_reason: Some("stop".to_string()), + }], + None, + usage, + ))) + } + + "response.incomplete" => { + // Incomplete response - typically due to length + let response = payload.get("response"); + let usage = response + .and_then(|r| r.get("usage")) + .map(|u| UniversalUsage::from_provider_value(u, self.format())); + + Ok(Some(UniversalStreamChunk::new( + None, + None, + vec![UniversalStreamChoice { + index: 0, + delta: Some(serde_json::json!({})), + finish_reason: Some("length".to_string()), + }], + None, + usage, + ))) + } + + "response.created" | "response.in_progress" => { + // Initial metadata events - extract model/id/usage + // Standard format: payload.response contains the data + // Alternate 
format: payload.delta.response contains the data + let response = if is_alternate_format { + delta_obj.and_then(|d| d.get("response")) + } else { + payload.get("response") + }; + let model = response + .and_then(|r| r.get("model")) + .and_then(Value::as_str) + .map(String::from); + let id = response + .and_then(|r| r.get("id")) + .and_then(Value::as_str) + .map(String::from); + let usage = response + .and_then(|r| r.get("usage")) + .map(|u| UniversalUsage::from_provider_value(u, self.format())); + + Ok(Some(UniversalStreamChunk::new( + id, + model, + vec![UniversalStreamChoice { + index: 0, + delta: Some(serde_json::json!({"role": "assistant", "content": ""})), + finish_reason: None, + }], + None, + usage, + ))) + } + + // All other events are metadata/keep-alive + _ => Ok(Some(UniversalStreamChunk::keep_alive())), + } + } + + fn stream_from_universal(&self, chunk: &UniversalStreamChunk) -> Result { + if chunk.is_keep_alive() { + // Return a generic in_progress event + return Ok(serde_json::json!({ + "type": "response.in_progress", + "sequence_number": 0 + })); + } + + // Check for finish chunk + let has_finish = chunk + .choices + .first() + .and_then(|c| c.finish_reason.as_ref()) + .is_some(); + + // Check if this is an initial metadata chunk (has model/id/usage but no content) + let is_initial_metadata = + (chunk.model.is_some() || chunk.id.is_some() || chunk.usage.is_some()) + && !has_finish + && chunk + .choices + .first() + .and_then(|c| c.delta.as_ref()) + .is_none_or(|d| { + // Initial chunk has role but empty/no content + d.get("content") + .and_then(Value::as_str) + .is_none_or(|s| s.is_empty()) + }); + + if is_initial_metadata { + // Return response.created with model/id/usage + let id = chunk + .id + .clone() + .unwrap_or_else(|| format!("resp_{}", PLACEHOLDER_ID)); + let mut response = serde_json::json!({ + "id": id, + "object": "response", + "model": chunk.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), + "status": "in_progress", + "output": [] + }); + + if let Some(usage) = &chunk.usage { + if let Some(obj) = response.as_object_mut() { + obj.insert("usage".into(), usage.to_provider_value(self.format())); + } + } + + return Ok(serde_json::json!({ + "type": "response.created", + "response": response + })); + } + + if has_finish { + let finish_reason = chunk.choices.first().and_then(|c| c.finish_reason.as_ref()); + let status = match finish_reason.map(|r| r.as_str()) { + Some("stop") => "completed", + Some("length") => "incomplete", + _ => "completed", + }; + + let id = chunk + .id + .clone() + .unwrap_or_else(|| format!("resp_{}", PLACEHOLDER_ID)); + let mut response = serde_json::json!({ + "id": id, + "object": "response", + "model": chunk.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), + "status": status, + "output": [] + }); + + if let Some(usage) = &chunk.usage { + if let Some(obj) = response.as_object_mut() { + obj.insert("usage".into(), usage.to_provider_value(self.format())); + } + } + + return Ok(serde_json::json!({ + "type": if status == "completed" { "response.completed" } else { "response.incomplete" }, + "response": response + })); + } + + // Check for content delta + if let Some(choice) = chunk.choices.first() { + if let Some(delta) = &choice.delta { + if let Some(content) = delta.get("content").and_then(Value::as_str) { + return Ok(serde_json::json!({ + "type": "response.output_text.delta", + "output_index": choice.index, + "content_index": 0, + "delta": content + })); + } + + // If content is null or missing, return empty text delta + // Using text delta (instead 
of output_item.start) ensures proper roundtrip + // since our stream_to_universal converts empty text back to null + // Note: When tool_calls are present with null content, this will emit empty text + // which is documented as an expected limitation in streaming_expected_differences.json + let content_is_missing_or_null = + delta.get("content").is_none() || delta.get("content") == Some(&Value::Null); + + if content_is_missing_or_null { + return Ok(serde_json::json!({ + "type": "response.output_text.delta", + "output_index": choice.index, + "content_index": 0, + "delta": "" + })); + } + } + } + + // Fallback - return output_text.delta with empty content + Ok(serde_json::json!({ + "type": "response.output_text.delta", + "output_index": 0, + "content_index": 0, + "delta": "" + })) + } +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json::json; + + #[test] + fn test_responses_detect_request() { + let adapter = ResponsesAdapter; + let payload = json!({ + "model": "o1", + "input": [{"role": "user", "content": "Hello"}] + }); + assert!(adapter.detect_request(&payload)); + } +} diff --git a/crates/lingua/src/providers/openai/test_chat_completions.rs b/crates/lingua/src/providers/openai/test_chat_completions.rs index 6932ccd4..c7b869bd 100644 --- a/crates/lingua/src/providers/openai/test_chat_completions.rs +++ b/crates/lingua/src/providers/openai/test_chat_completions.rs @@ -1,6 +1,8 @@ +use crate::providers::openai::convert::{ + ChatCompletionRequestMessageExt, ChatCompletionResponseMessageExt, +}; use crate::providers::openai::generated::{ - ChatCompletionRequestMessage, ChatCompletionResponseMessage, CreateChatCompletionRequestClass, - CreateChatCompletionResponse, + CreateChatCompletionRequestClass, CreateChatCompletionResponse, }; use crate::serde_json::Value; use crate::universal::{convert::TryFromLLM, Message}; @@ -34,19 +36,32 @@ mod tests { run_roundtrip_test( case, - // Extract messages from request + // Extract messages from request (convert to extended type) |request: &CreateChatCompletionRequestClass| Ok(&request.messages), - // Convert to universal - |messages: &Vec| { - as TryFromLLM>>::try_from( - messages.clone(), + // Convert to universal (via extended type) + |messages: &Vec| { + // Wrap base messages in extended type for conversion + let ext_messages: Vec = messages + .iter() + .map(|m| ChatCompletionRequestMessageExt { + base: m.clone(), + reasoning: None, + reasoning_signature: None, + }) + .collect(); + as TryFromLLM>>::try_from( + ext_messages, ) .map_err(|e| format!("Failed to convert to universal format: {}", e)) }, // Convert from universal |messages: Vec| { - as TryFromLLM>>::try_from(messages) - .map_err(|e| format!("Failed to roundtrip conversion: {}", e)) + let ext_messages = as TryFromLLM< + Vec, + >>::try_from(messages) + .map_err(|e| format!("Failed to roundtrip conversion: {}", e))?; + // Extract base messages (reasoning would be in separate field) + Ok(ext_messages.into_iter().map(|m| m.base).collect()) }, // Extract response content (collect response messages from choices) |response: &CreateChatCompletionResponse| { @@ -57,13 +72,21 @@ mod tests { .collect(); Ok(response_messages) }, - // Convert response to universal - |response_messages: &Vec| { + // Convert response to universal (via extended type) + |response_messages: &Vec< + crate::providers::openai::generated::ChatCompletionResponseMessage, + >| { let mut universal_messages = Vec::new(); for response_message in response_messages { + // Wrap base message in extended type for conversion 
+ let ext_msg = ChatCompletionResponseMessageExt { + base: response_message.clone(), + reasoning: None, + reasoning_signature: None, + }; let universal_msg: Message = >::try_from(response_message) + ChatCompletionResponseMessageExt, + >>::try_from(ext_msg) .map_err(|e| { format!("Failed to convert response to universal format: {}", e) })?; @@ -75,12 +98,13 @@ mod tests { |messages: Vec| { let mut response_messages = Vec::new(); for universal_msg in &messages { - let response_msg: ChatCompletionResponseMessage = - >::try_from( + let ext_msg: ChatCompletionResponseMessageExt = + >::try_from( universal_msg, ) .map_err(|e| format!("Failed to roundtrip response conversion: {}", e))?; - response_messages.push(response_msg); + // Extract base message (reasoning would be in separate field) + response_messages.push(ext_msg.base); } Ok(response_messages) }, diff --git a/crates/lingua/src/python.rs b/crates/lingua/src/python.rs index aead002d..7e25e702 100644 --- a/crates/lingua/src/python.rs +++ b/crates/lingua/src/python.rs @@ -3,6 +3,7 @@ use serde::{Deserialize, Serialize}; // Import our types and conversion traits use crate::providers::anthropic::generated as anthropic; +use crate::providers::openai::convert::ChatCompletionRequestMessageExt; use crate::providers::openai::generated as openai; use crate::serde_json; use crate::universal::{convert::TryFromLLM, Message}; @@ -76,13 +77,13 @@ where /// Convert array of Chat Completions messages to Lingua Messages #[pyfunction] fn chat_completions_messages_to_lingua(py: Python, value: &PyAny) -> PyResult { - convert_to_lingua::, Vec>(py, value) + convert_to_lingua::, Vec>(py, value) } /// Convert array of Lingua Messages to Chat Completions messages #[pyfunction] fn lingua_to_chat_completions_messages(py: Python, value: &PyAny) -> PyResult { - convert_from_lingua::, Vec>(py, value) + convert_from_lingua::, Vec>(py, value) } /// Convert array of Responses API messages to Lingua Messages diff --git a/crates/lingua/src/universal/mod.rs b/crates/lingua/src/universal/mod.rs index eacc0c6e..720c7499 100644 --- a/crates/lingua/src/universal/mod.rs +++ b/crates/lingua/src/universal/mod.rs @@ -12,15 +12,27 @@ This module provides a 1:1 Rust implementation of the AI SDK ModelMessage format pub mod convert; pub mod defaults; pub mod message; +pub mod reasoning; pub mod request; pub mod response; +pub mod response_format; pub mod stream; +pub mod tool_choice; +pub mod tools; pub mod transform; // Re-export main types for convenience pub use defaults::*; pub use message::*; -pub use request::{UniversalParams, UniversalRequest}; +pub use request::{ + parse_stop_sequences, JsonSchemaConfig, ReasoningConfig, ReasoningEffort, ResponseFormatConfig, + ResponseFormatType, SummaryMode, ToolChoiceConfig, ToolChoiceMode, UniversalParams, + UniversalRequest, +}; pub use response::{FinishReason, UniversalResponse, UniversalUsage}; pub use stream::{UniversalStreamChoice, UniversalStreamChunk}; +pub use tools::{ + tools_to_anthropic_value, tools_to_openai_chat_value, tools_to_responses_value, UniversalTool, + UniversalToolType, +}; pub use transform::{extract_system_messages, flatten_consecutive_messages}; diff --git a/crates/lingua/src/universal/reasoning.rs b/crates/lingua/src/universal/reasoning.rs new file mode 100644 index 00000000..749722bb --- /dev/null +++ b/crates/lingua/src/universal/reasoning.rs @@ -0,0 +1,527 @@ +/*! +Reasoning conversion utilities for cross-provider semantic translation. 
+ +This module provides heuristics for converting between different providers' +reasoning/thinking configurations: +- OpenAI Chat: `reasoning_effort` (low/medium/high) +- OpenAI Responses: `reasoning` object with `effort` and `summary` fields +- Anthropic: `thinking.budget_tokens` +- Google: `thinkingConfig.thinkingBudget` + +## Canonical Format + +The universal representation uses `budget_tokens` as the single canonical field. +Adapters convert between provider-specific formats (like OpenAI's effort levels) +and the canonical token budget at the provider boundary. + +## Design + +The conversion uses documented, deterministic heuristics: +- `effort_to_budget`: Converts effort level to token budget using multipliers +- `budget_to_effort`: Converts token budget to effort level using thresholds + +All conversions happen in adapter code via trait implementations, not in universal types. + +## Usage + +```ignore +use crate::universal::request::ReasoningConfig; +use crate::providers::openai::generated::ReasoningEffort as OpenAIEffort; + +// FROM OpenAI: Use tuple-based From trait for context-aware conversion +let config: ReasoningConfig = (openai_effort, Some(max_tokens)).into(); + +// FROM OpenAI: Fallback without max_tokens (uses DEFAULT_MAX_TOKENS) +let config: ReasoningConfig = (&openai_reasoning).into(); + +// FROM Anthropic: Direct conversion (already uses budget_tokens) +let config: ReasoningConfig = (&anthropic_thinking).into(); + +// TO provider: Convert at adapter boundary +let output = config.to_provider(ProviderFormat::Anthropic, Some(4096))?; +``` +*/ + +use crate::capabilities::ProviderFormat; +use crate::processing::transform::TransformError; +use crate::providers::anthropic::generated::{Thinking, ThinkingType}; +use crate::providers::openai::generated::{ + Reasoning as OpenAIReasoning, ReasoningEffort as OpenAIReasoningEffort, + Summary as OpenAISummary, +}; +use crate::serde_json::{json, Map, Value}; +#[cfg(test)] +use crate::universal::request::SummaryMode; +use crate::universal::request::{ReasoningConfig, ReasoningEffort}; + +// ============================================================================= +// Heuristic Constants +// ============================================================================= + +/// Multiplier for "low" effort (25% of max_tokens) +pub const EFFORT_LOW_MULTIPLIER: f64 = 0.25; + +/// Multiplier for "medium" effort (50% of max_tokens) +pub const EFFORT_MEDIUM_MULTIPLIER: f64 = 0.50; + +/// Multiplier for "high" effort (75% of max_tokens) +pub const EFFORT_HIGH_MULTIPLIER: f64 = 0.75; + +/// Threshold below which budget is considered "low" effort +pub const EFFORT_LOW_THRESHOLD: f64 = 0.35; + +/// Threshold above which budget is considered "high" effort +pub const EFFORT_HIGH_THRESHOLD: f64 = 0.65; + +/// Minimum thinking budget for Anthropic +pub const MIN_THINKING_BUDGET: i64 = 1024; + +/// Default max_tokens to use when not specified +pub const DEFAULT_MAX_TOKENS: i64 = 4096; + +/// Default reasoning effort when enabled but no budget specified +pub const DEFAULT_REASONING_EFFORT: ReasoningEffort = ReasoningEffort::Medium; + +/// Required temperature for Anthropic when thinking is enabled +pub const ANTHROPIC_THINKING_TEMPERATURE: f64 = 1.0; + +// ============================================================================= +// Effort ↔ Budget Conversion +// ============================================================================= + +/// Convert effort level to token budget. 
+/// +/// Uses multipliers applied to max_tokens: +/// - low: 25% of max_tokens +/// - medium: 50% of max_tokens +/// - high: 75% of max_tokens +/// +/// Result is clamped to minimum of 1024 tokens (Anthropic requirement). +pub fn effort_to_budget(effort: ReasoningEffort, max_tokens: Option) -> i64 { + let max = max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); + let multiplier = match effort { + ReasoningEffort::Low => EFFORT_LOW_MULTIPLIER, + ReasoningEffort::Medium => EFFORT_MEDIUM_MULTIPLIER, + ReasoningEffort::High => EFFORT_HIGH_MULTIPLIER, + }; + let budget = (max as f64 * multiplier).floor() as i64; + budget.max(MIN_THINKING_BUDGET) +} + +/// Convert token budget to effort level. +/// +/// Uses ratio of budget/max_tokens with thresholds: +/// - ratio < 0.35: low +/// - 0.35 <= ratio < 0.65: medium +/// - ratio >= 0.65: high +pub fn budget_to_effort(budget: i64, max_tokens: Option) -> ReasoningEffort { + let max = max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); + let ratio = budget as f64 / max as f64; + + if ratio < EFFORT_LOW_THRESHOLD { + ReasoningEffort::Low + } else if ratio < EFFORT_HIGH_THRESHOLD { + ReasoningEffort::Medium + } else { + ReasoningEffort::High + } +} + +// ============================================================================= +// Typed From Implementations for Provider-to-Universal Conversions +// ============================================================================= + +/// Convert Anthropic Thinking to ReasoningConfig. +/// +/// Anthropic's thinking is already normalized on `budget_tokens`, so this is a direct mapping. +impl From<&Thinking> for ReasoningConfig { + fn from(thinking: &Thinking) -> Self { + ReasoningConfig { + enabled: Some(matches!(thinking.thinking_type, ThinkingType::Enabled)), + budget_tokens: thinking.budget_tokens, + ..Default::default() + } + } +} + +/// Convert OpenAI ReasoningEffort to ReasoningConfig with context (for Chat API). +/// +/// Takes max_tokens as context to compute accurate budget_tokens. +/// Uses DEFAULT_MAX_TOKENS if max_tokens is None. +impl From<(OpenAIReasoningEffort, Option)> for ReasoningConfig { + fn from((effort, max_tokens): (OpenAIReasoningEffort, Option)) -> Self { + let universal_effort = match effort { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(effort_to_budget(universal_effort, max_tokens)), + ..Default::default() + } + } +} + +/// Convert OpenAI Reasoning to ReasoningConfig (for Responses API) - fallback. +/// +/// Uses DEFAULT_MAX_TOKENS for effort→budget conversion when max_tokens is not available. +/// For context-aware conversion, use the tuple-based From impl. 
+impl From<&OpenAIReasoning> for ReasoningConfig { + fn from(reasoning: &OpenAIReasoning) -> Self { + let budget_tokens = reasoning.effort.as_ref().map(|e| { + let universal_effort = match e { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + effort_to_budget(universal_effort, None) // Uses DEFAULT_MAX_TOKENS + }); + + let summary = reasoning + .summary + .as_ref() + .or(reasoning.generate_summary.as_ref()) + .map(|s| match s { + OpenAISummary::Auto => crate::universal::request::SummaryMode::Auto, + OpenAISummary::Concise => crate::universal::request::SummaryMode::Auto, // Map concise to auto + OpenAISummary::Detailed => crate::universal::request::SummaryMode::Detailed, + }); + + ReasoningConfig { + enabled: Some(true), + budget_tokens, + summary, + } + } +} + +/// Convert OpenAI Reasoning to ReasoningConfig with context (for Responses API). +/// +/// Takes max_tokens as context to compute accurate budget_tokens. +/// Uses provided max_tokens or DEFAULT_MAX_TOKENS if None. +impl From<(&OpenAIReasoning, Option)> for ReasoningConfig { + fn from((reasoning, max_tokens): (&OpenAIReasoning, Option)) -> Self { + let budget_tokens = reasoning.effort.as_ref().map(|e| { + let universal_effort = match e { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + effort_to_budget(universal_effort, max_tokens) + }); + + let summary = reasoning + .summary + .as_ref() + .or(reasoning.generate_summary.as_ref()) + .map(|s| match s { + OpenAISummary::Auto => crate::universal::request::SummaryMode::Auto, + OpenAISummary::Concise => crate::universal::request::SummaryMode::Auto, // Map concise to auto + OpenAISummary::Detailed => crate::universal::request::SummaryMode::Detailed, + }); + + ReasoningConfig { + enabled: Some(true), + budget_tokens, + summary, + } + } +} + +// ============================================================================= +// to_provider Method for TO Conversions +// ============================================================================= + +impl ReasoningConfig { + /// Convert this config to a provider-specific value. 
+ /// + /// # Arguments + /// * `provider` - Target provider format + /// * `max_tokens` - Max tokens for effort→budget conversion (for Anthropic/Google) + /// + /// # Returns + /// `Ok(Some(value))` if conversion succeeded + /// `Ok(None)` if reasoning is not enabled or no value should be set + /// `Err(_)` if conversion failed + pub fn to_provider( + &self, + provider: ProviderFormat, + max_tokens: Option, + ) -> Result, TransformError> { + match provider { + ProviderFormat::OpenAI => Ok(to_openai_chat(self, max_tokens).map(Value::String)), + ProviderFormat::Responses => Ok(to_openai_responses(self, max_tokens)), + ProviderFormat::Anthropic => Ok(to_anthropic(self, max_tokens)), + ProviderFormat::Converse => Ok(to_anthropic(self, max_tokens)), // Bedrock uses same format as Anthropic + ProviderFormat::Google => Ok(to_google(self, max_tokens)), + _ => Ok(None), + } + } +} + +// ============================================================================= +// Value-based Helper Functions - For Providers Without Typed Params +// ============================================================================= + +/// Parse Google `thinkingConfig` object into ReasoningConfig. +/// +/// Google doesn't have typed params yet, so we still need Value-based parsing. +pub fn from_google(config: &Value) -> ReasoningConfig { + let enabled = config + .get("includeThoughts") + .and_then(Value::as_bool) + .or_else(|| { + // If thinkingBudget > 0, thinking is enabled + config + .get("thinkingBudget") + .and_then(Value::as_i64) + .map(|b| b > 0) + }); + + let budget_tokens = config.get("thinkingBudget").and_then(Value::as_i64); + + ReasoningConfig { + enabled, + budget_tokens, + ..Default::default() + } +} + +// ============================================================================= +// Private Helper Functions - TO Provider Formats +// ============================================================================= + +/// Convert ReasoningConfig to OpenAI Chat `reasoning_effort` string. +fn to_openai_chat(config: &ReasoningConfig, max_tokens: Option) -> Option { + if config.enabled != Some(true) { + return None; + } + + // Convert budget_tokens → effort at adapter boundary + if let Some(budget) = config.budget_tokens { + let effort = budget_to_effort(budget, max_tokens); + return Some(effort.to_string()); + } + + // If just enabled with no specifics, use default effort + Some(DEFAULT_REASONING_EFFORT.to_string()) +} + +/// Convert ReasoningConfig to OpenAI Responses API `reasoning` object. +fn to_openai_responses(config: &ReasoningConfig, max_tokens: Option) -> Option { + if config.enabled != Some(true) { + return None; + } + + let mut obj = Map::new(); + + // Convert budget_tokens → effort at adapter boundary + let effort = if let Some(budget) = config.budget_tokens { + budget_to_effort(budget, max_tokens).to_string() + } else { + DEFAULT_REASONING_EFFORT.to_string() // Default if only enabled=true + }; + + obj.insert("effort".into(), Value::String(effort)); + + // Summary + if let Some(summary) = config.summary { + obj.insert("summary".into(), Value::String(summary.to_string())); + } + + Some(Value::Object(obj)) +} + +/// Convert ReasoningConfig to Anthropic `thinking` object. 
+fn to_anthropic(config: &ReasoningConfig, _max_tokens: Option) -> Option { + if config.enabled != Some(true) { + return None; + } + + // Use budget_tokens or default minimum + let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + + Some(json!({ + "type": "enabled", + "budget_tokens": budget + })) +} + +/// Convert ReasoningConfig to Google `thinkingConfig` object. +fn to_google(config: &ReasoningConfig, _max_tokens: Option) -> Option { + if config.enabled != Some(true) { + return None; + } + + // Use budget_tokens or default minimum + let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + + Some(json!({ + "includeThoughts": true, + "thinkingBudget": budget + })) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_effort_to_budget() { + // With default max_tokens (4096) + assert_eq!(effort_to_budget(ReasoningEffort::Low, None), 1024); // 4096 * 0.25 = 1024 + assert_eq!(effort_to_budget(ReasoningEffort::Medium, None), 2048); // 4096 * 0.50 = 2048 + assert_eq!(effort_to_budget(ReasoningEffort::High, None), 3072); // 4096 * 0.75 = 3072 + + // With custom max_tokens + assert_eq!(effort_to_budget(ReasoningEffort::Medium, Some(8192)), 4096); + + // Minimum budget enforced + assert_eq!(effort_to_budget(ReasoningEffort::Low, Some(1000)), 1024); // Would be 250, clamped to 1024 + } + + #[test] + fn test_budget_to_effort() { + // With default max_tokens (4096) + assert_eq!(budget_to_effort(500, None), ReasoningEffort::Low); // 500/4096 = 0.12 < 0.35 + assert_eq!(budget_to_effort(2000, None), ReasoningEffort::Medium); // 2000/4096 = 0.49 + assert_eq!(budget_to_effort(3000, None), ReasoningEffort::High); // 3000/4096 = 0.73 >= 0.65 + + // With custom max_tokens + assert_eq!(budget_to_effort(4096, Some(8192)), ReasoningEffort::Medium); + // 4096/8192 = 0.5 + } + + #[test] + fn test_roundtrip_effort() { + // effort → budget → effort should preserve the original level + for effort in [ + ReasoningEffort::Low, + ReasoningEffort::Medium, + ReasoningEffort::High, + ] { + let budget = effort_to_budget(effort, Some(4096)); + let back = budget_to_effort(budget, Some(4096)); + assert_eq!(effort, back, "Roundtrip failed for {:?}", effort); + } + } + + #[test] + fn test_from_anthropic_thinking() { + let thinking = Thinking { + thinking_type: ThinkingType::Enabled, + budget_tokens: Some(2048), + }; + let config = ReasoningConfig::from(&thinking); + assert_eq!(config.enabled, Some(true)); + assert_eq!(config.budget_tokens, Some(2048)); + } + + #[test] + fn test_to_anthropic_thinking() { + let config = ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(2048), + ..Default::default() + }; + + let thinking = config + .to_provider(ProviderFormat::Anthropic, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 2048); + } + + #[test] + fn test_to_openai_chat_reasoning() { + let config = ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(2048), + ..Default::default() + }; + + let effort = config + .to_provider(ProviderFormat::OpenAI, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(effort.as_str().unwrap(), "medium"); // 2048/4096 = 0.5 → medium + } + + #[test] + fn test_from_openai_reasoning_effort() { + // Test tuple-based conversion with max_tokens + let config = ReasoningConfig::from((OpenAIReasoningEffort::High, Some(4096))); + assert_eq!(config.enabled, Some(true)); + assert_eq!(config.budget_tokens, Some(3072)); // 75% of 4096 + } + + #[test] + fn 
test_from_openai_responses_reasoning() { + let reasoning = OpenAIReasoning { + effort: Some(OpenAIReasoningEffort::High), + summary: Some(OpenAISummary::Detailed), + generate_summary: None, + }; + + // Test fallback conversion (uses DEFAULT_MAX_TOKENS) + let config_fallback = ReasoningConfig::from(&reasoning); + assert_eq!(config_fallback.enabled, Some(true)); + assert_eq!(config_fallback.budget_tokens, Some(3072)); // 75% of DEFAULT_MAX_TOKENS (4096) + assert_eq!(config_fallback.summary, Some(SummaryMode::Detailed)); + + // Test context-aware conversion with custom max_tokens + let config_context = ReasoningConfig::from((&reasoning, Some(8192))); + assert_eq!(config_context.enabled, Some(true)); + assert_eq!(config_context.budget_tokens, Some(6144)); // 75% of 8192 + assert_eq!(config_context.summary, Some(SummaryMode::Detailed)); + } + + #[test] + fn test_to_bedrock_thinking() { + // Bedrock uses the same format as Anthropic for Claude models + let config = ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(3072), + ..Default::default() + }; + + let thinking = config + .to_provider(ProviderFormat::Converse, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 3072); + } + + #[test] + fn test_to_bedrock_thinking_with_budget() { + // When budget_tokens is explicitly set, it should be used directly + let config = ReasoningConfig { + enabled: Some(true), + budget_tokens: Some(5000), + ..Default::default() + }; + + let thinking = config + .to_provider(ProviderFormat::Converse, Some(8192)) + .unwrap() + .unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 5000); + } + + #[test] + fn test_to_bedrock_thinking_disabled() { + let config = ReasoningConfig { + enabled: Some(false), + ..Default::default() + }; + + let result = config + .to_provider(ProviderFormat::Converse, Some(4096)) + .unwrap(); + assert!(result.is_none()); + } +} diff --git a/crates/lingua/src/universal/request.rs b/crates/lingua/src/universal/request.rs index bd0b7ece..b2afc6b8 100644 --- a/crates/lingua/src/universal/request.rs +++ b/crates/lingua/src/universal/request.rs @@ -6,24 +6,39 @@ converted to/from any provider format. ## Design principles -1. **Round-trip preservation**: Any field not mapped to a canonical field goes - into `extras` and is restored when converting back to the source format. +1. **Round-trip preservation**: Provider-specific fields are stored in + `provider_extras` keyed by `ProviderFormat`, and restored when converting + back to the same provider format. 2. **Canonical naming**: Uses consistent field names (e.g., `max_tokens`, `top_p`) regardless of what individual providers call them. -3. **Minimal typing for complex fields**: Fields like `tools`, `tool_choice`, and - `response_format` are kept as `Value` since they vary significantly across providers. +3. **Typed configs**: Complex fields like `tool_choice`, `response_format`, `reasoning`, + and `stop` use typed structs. Only `tools` and `metadata` remain as `Value`. + +4. **Provider isolation**: Provider-specific extras are scoped by `ProviderFormat` + to prevent cross-provider contamination (e.g., OpenAI extras don't bleed into + Anthropic requests). 
*/ +use std::collections::HashMap; +use std::fmt; +use std::str::FromStr; + +use serde::{Deserialize, Serialize}; + +use crate::capabilities::ProviderFormat; +use crate::error::ConvertError; use crate::serde_json::{Map, Value}; use crate::universal::message::Message; +use crate::universal::tools::UniversalTool; /// Universal request envelope for LLM API calls. /// /// This type captures the common structure across all provider request formats. -/// Provider-specific fields that don't map to canonical params go into `extras`. -#[derive(Debug, Clone)] +/// Provider-specific fields are stored in `provider_extras`, keyed by the source +/// provider format to prevent cross-provider contamination. +#[derive(Debug, Clone, Serialize)] pub struct UniversalRequest { /// Model identifier (may be None for providers that use endpoint-based model selection) pub model: Option, @@ -31,18 +46,27 @@ pub struct UniversalRequest { /// Conversation messages in universal format pub messages: Vec, - /// Common request parameters + /// Common request parameters (canonical fields only) pub params: UniversalParams, - /// Provider-specific fields not captured in params - pub extras: Map, + /// Provider-specific fields, keyed by the source ProviderFormat. + /// + /// When transforming back to the same provider, these extras are merged back. + /// When transforming to a different provider, they are ignored (no cross-pollination). + /// + /// Example: OpenAI Chat extras stay in `provider_extras[ProviderFormat::OpenAI]` + /// and are only merged back when converting to OpenAI Chat, not to Anthropic. + #[serde(skip)] + pub provider_extras: HashMap>, } /// Common request parameters across providers. /// /// Uses canonical names - adapters handle mapping to provider-specific names. -#[derive(Debug, Clone, Default)] +/// This struct contains ONLY canonical fields - no extras or provider-specific baggage. +#[derive(Debug, Clone, Default, Serialize)] pub struct UniversalParams { + // === Sampling parameters === /// Sampling temperature (0.0 to 2.0 typically) pub temperature: Option, @@ -52,30 +76,535 @@ pub struct UniversalParams { /// Top-k sampling (not supported by all providers) pub top_k: Option, + /// Random seed for deterministic generation + pub seed: Option, + + /// Presence penalty (-2.0 to 2.0) + pub presence_penalty: Option, + + /// Frequency penalty (-2.0 to 2.0) + pub frequency_penalty: Option, + + // === Output control === /// Maximum tokens to generate pub max_tokens: Option, - /// Stop sequences (kept as Value due to union type in OpenAI) - pub stop: Option, + /// Stop sequences for generation termination. + /// + /// All providers accept arrays of strings. OpenAI also accepts a single string, + /// but we normalize to arrays for simplicity - OpenAI accepts both forms. + pub stop: Option>, - /// Tool definitions (schema varies by provider) - pub tools: Option, + /// Whether to return log probabilities (OpenAI-specific but canonical) + pub logprobs: Option, - /// Tool selection strategy (varies by provider) - pub tool_choice: Option, + /// Number of top logprobs to return (0-20) + pub top_logprobs: Option, - /// Output format specification (varies by provider) - pub response_format: Option, + // === Tools and function calling === + /// Tool definitions in universal format. 
+ /// + /// Tools are normalized to `UniversalTool` which handles the different formats: + /// - Anthropic: `{"name", "description", "input_schema"}` for custom, `{"type": "bash_20250124"}` for builtins + /// - OpenAI Chat: `{"type": "function", "function": {...}}` + /// - OpenAI Responses: `{"type": "function", "name", ...}` or `{"type": "code_interpreter"}` + pub tools: Option>, - /// Random seed for deterministic generation - pub seed: Option, + /// Tool selection strategy configuration. + /// + /// Uses canonical fields (`mode`, `tool_name`) for cross-provider conversion. + pub tool_choice: Option, - /// Presence penalty (-2.0 to 2.0) - pub presence_penalty: Option, + /// Whether tools can be called in parallel + pub parallel_tool_calls: Option, - /// Frequency penalty (-2.0 to 2.0) - pub frequency_penalty: Option, + // === Response format === + /// Response format configuration. + /// + /// Uses canonical fields (`format_type`, `json_schema`) for cross-provider conversion. + pub response_format: Option, + + // === Reasoning / Extended thinking === + /// Reasoning configuration for extended thinking / chain-of-thought. + /// + /// Uses canonical fields (`effort`, `budget_tokens`) for cross-provider conversion. + /// Skipped when disabled or empty to normalize `{enabled: false}` to `null`. + #[serde(skip_serializing_if = "reasoning_should_skip")] + pub reasoning: Option, + + // === Metadata and identification === + /// Request metadata (user tracking, experiment tags, etc.) + pub metadata: Option, + + /// Whether to store completion for training/evals (OpenAI-specific but canonical) + pub store: Option, + + /// Service tier preference + pub service_tier: Option, + // === Streaming === /// Whether to stream the response pub stream: Option, } + +// ============================================================================= +// UniversalParams Helper Methods +// ============================================================================= + +impl UniversalParams { + /// Get tool_choice for a provider. + pub fn tool_choice_for(&self, provider: ProviderFormat) -> Option { + let config = self.tool_choice.clone().unwrap_or_default(); + config + .to_provider(provider, self.parallel_tool_calls) + .ok() + .flatten() + } + + /// Get reasoning config for a provider. + /// + /// This helper reduces boilerplate in adapters by handling the common pattern: + /// ```ignore + /// req.params.reasoning.as_ref() + /// .and_then(|r| r.to_provider(provider, max_tokens).ok()) + /// .flatten() + /// ``` + pub fn reasoning_for(&self, provider: ProviderFormat) -> Option { + self.reasoning + .as_ref() + .and_then(|r| r.to_provider(provider, self.max_tokens).ok()) + .flatten() + } + + /// Get response_format for a provider. + /// + /// This helper reduces boilerplate in adapters by handling the common pattern: + /// ```ignore + /// req.params.response_format.as_ref() + /// .and_then(|rf| rf.to_provider(provider).ok()) + /// .flatten() + /// ``` + pub fn response_format_for(&self, provider: ProviderFormat) -> Option { + self.response_format + .as_ref() + .and_then(|rf| rf.to_provider(provider).ok()) + .flatten() + } +} + +// ============================================================================= +// Reasoning Configuration +// ============================================================================= + +/// Configuration for extended thinking / reasoning capabilities. +/// +/// Uses `budget_tokens` as the canonical field for cross-provider conversion. 
+/// When converting TO a provider, values are converted at the adapter boundary. +/// OpenAI's `reasoning_effort` levels are converted to/from budget_tokens using heuristics. +#[derive(Debug, Clone, Default, Serialize, Deserialize)] +pub struct ReasoningConfig { + /// Whether reasoning/thinking is enabled. + #[serde(skip_serializing_if = "Option::is_none")] + pub enabled: Option, + + /// Token budget for thinking (canonical field). + /// All providers' reasoning configurations are normalized to this field. + /// OpenAI effort levels are converted to budget_tokens at adapter boundaries. + #[serde(skip_serializing_if = "Option::is_none")] + pub budget_tokens: Option, + + /// Summary mode for reasoning output. + /// Maps to OpenAI Responses API's `reasoning.summary` field. + #[serde(skip_serializing_if = "Option::is_none")] + pub summary: Option, +} + +impl ReasoningConfig { + /// Returns true if this config represents "no reasoning" (disabled or empty). + /// Used for skip_serializing_if to normalize disabled configs to null. + pub fn is_effectively_disabled(&self) -> bool { + // Explicitly disabled + if self.enabled == Some(false) { + return true; + } + // Empty config (no meaningful fields set) + self.enabled.is_none() && self.budget_tokens.is_none() && self.summary.is_none() + } +} + +/// Helper for serde skip_serializing_if on Option. +/// Returns true if the reasoning config should be skipped during serialization. +fn reasoning_should_skip(reasoning: &Option) -> bool { + match reasoning { + None => true, + Some(config) => config.is_effectively_disabled(), + } +} + +/// Reasoning effort level (portable across providers). +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize)] +pub enum ReasoningEffort { + Low, + Medium, + High, +} + +impl ReasoningEffort { + /// Returns the string representation. + pub fn as_str(&self) -> &'static str { + match self { + Self::Low => "low", + Self::Medium => "medium", + Self::High => "high", + } + } +} + +impl FromStr for ReasoningEffort { + type Err = ConvertError; + + fn from_str(s: &str) -> Result { + match s.to_lowercase().as_str() { + "low" => Ok(Self::Low), + "medium" => Ok(Self::Medium), + "high" => Ok(Self::High), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "ReasoningEffort", + value: s.to_string(), + }), + } + } +} + +impl fmt::Display for ReasoningEffort { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + f.write_str(self.as_str()) + } +} + +impl AsRef for ReasoningEffort { + fn as_ref(&self) -> &str { + self.as_str() + } +} + +/// Summary mode for reasoning output. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)] +pub enum SummaryMode { + /// No summary included in response. + None, + /// Provider decides whether to include summary. + Auto, + /// Detailed summary included in response. + Detailed, +} + +impl SummaryMode { + /// Returns the string representation. 
+ pub fn as_str(&self) -> &'static str { + match self { + Self::None => "none", + Self::Auto => "auto", + Self::Detailed => "detailed", + } + } +} + +impl FromStr for SummaryMode { + type Err = ConvertError; + + fn from_str(s: &str) -> Result { + match s.to_lowercase().as_str() { + "none" => Ok(Self::None), + "auto" => Ok(Self::Auto), + "detailed" => Ok(Self::Detailed), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "SummaryMode", + value: s.to_string(), + }), + } + } +} + +impl fmt::Display for SummaryMode { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + f.write_str(self.as_str()) + } +} + +impl AsRef for SummaryMode { + fn as_ref(&self) -> &str { + self.as_str() + } +} + +// ============================================================================= +// Tool Choice Configuration +// ============================================================================= + +/// Tool selection strategy configuration. +/// +/// Uses canonical fields (`mode`, `tool_name`) for cross-provider conversion. +/// +/// Provider mapping: +/// - OpenAI Chat: `"auto"` | `"none"` | `"required"` | `{ type: "function", function: { name } }` +/// - OpenAI Responses: `"auto"` | `{ type: "function", name }` +/// - Anthropic: `{ type: "auto" | "any" | "none" | "tool", name?, disable_parallel_tool_use? }` +#[derive(Debug, Clone, Default, Serialize)] +pub struct ToolChoiceConfig { + /// Selection mode - the semantic intent of the tool choice + pub mode: Option, + + /// Specific tool name (when mode = Tool) + pub tool_name: Option, + + /// Whether to disable parallel tool calls. + /// Maps to Anthropic's `disable_parallel_tool_use` field. + /// For OpenAI, this is handled via the separate `parallel_tool_calls` param. + pub disable_parallel: Option, +} + +/// Tool selection mode (portable across providers). +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize)] +pub enum ToolChoiceMode { + /// Provider decides whether to use tools + Auto, + /// No tools allowed + None, + /// Must use a tool (OpenAI "required" / Anthropic "any") + Required, + /// Specific tool required (use `tool_name` field) + Tool, +} + +impl ToolChoiceMode { + /// Returns the string representation (OpenAI format). + pub fn as_str(&self) -> &'static str { + match self { + Self::Auto => "auto", + Self::None => "none", + Self::Required => "required", + Self::Tool => "function", + } + } + + /// Convert to Anthropic format string. + pub fn as_anthropic_str(&self) -> &'static str { + match self { + Self::Auto => "auto", + Self::None => "none", + Self::Required => "any", + Self::Tool => "tool", + } + } +} + +impl FromStr for ToolChoiceMode { + type Err = ConvertError; + + fn from_str(s: &str) -> Result { + match s.to_lowercase().as_str() { + "auto" => Ok(Self::Auto), + "none" => Ok(Self::None), + "required" | "any" => Ok(Self::Required), + "tool" | "function" => Ok(Self::Tool), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "ToolChoiceMode", + value: s.to_string(), + }), + } + } +} + +impl fmt::Display for ToolChoiceMode { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + f.write_str(self.as_str()) + } +} + +impl AsRef for ToolChoiceMode { + fn as_ref(&self) -> &str { + self.as_str() + } +} + +// ============================================================================= +// Response Format Configuration +// ============================================================================= + +/// Response format configuration for structured output. 
+/// +/// Provider mapping: +/// - OpenAI Chat: `{ type: "text" | "json_object" | "json_schema", json_schema? }` +/// - OpenAI Responses: nested under `text.format` +/// - Google: `response_mime_type` + `response_schema` +/// - Anthropic: `{ type: "json_schema", schema, name?, strict?, description? }` +#[derive(Debug, Clone, Default, Serialize)] +pub struct ResponseFormatConfig { + /// Output format type + pub format_type: Option, + + /// JSON schema configuration (when format_type = JsonSchema) + pub json_schema: Option, +} + +/// Response format type (portable across providers). +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize)] +pub enum ResponseFormatType { + /// Plain text output (default) + Text, + /// JSON object output (unstructured) + JsonObject, + /// JSON output conforming to a schema + JsonSchema, +} + +impl ResponseFormatType { + /// Returns the string representation. + pub fn as_str(&self) -> &'static str { + match self { + Self::Text => "text", + Self::JsonObject => "json_object", + Self::JsonSchema => "json_schema", + } + } +} + +impl FromStr for ResponseFormatType { + type Err = ConvertError; + + fn from_str(s: &str) -> Result { + match s.to_lowercase().as_str() { + "text" => Ok(Self::Text), + "json_object" => Ok(Self::JsonObject), + "json_schema" => Ok(Self::JsonSchema), + _ => Err(ConvertError::InvalidEnumValue { + type_name: "ResponseFormatType", + value: s.to_string(), + }), + } + } +} + +impl fmt::Display for ResponseFormatType { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + f.write_str(self.as_str()) + } +} + +impl AsRef for ResponseFormatType { + fn as_ref(&self) -> &str { + self.as_str() + } +} + +/// JSON schema configuration for structured output. +#[derive(Debug, Clone, Serialize)] +pub struct JsonSchemaConfig { + /// Schema name (required by OpenAI) + pub name: String, + + /// The JSON schema definition + pub schema: Value, + + /// Whether to enable strict schema validation + pub strict: Option, + + /// Human-readable description of the schema + pub description: Option, +} + +// ============================================================================= +// Stop Sequences Helper +// ============================================================================= + +/// Parse stop sequences from a JSON value. 
+/// +/// Handles: +/// - `"single_string"` → `vec!["single_string"]` +/// - `["arr", "of", "strings"]` → `vec!["arr", "of", "strings"]` +/// - Other types → `None` +pub fn parse_stop_sequences(value: &Value) -> Option> { + match value { + Value::String(s) => Some(vec![s.clone()]), + Value::Array(arr) => { + let sequences: Vec = arr + .iter() + .filter_map(Value::as_str) + .map(String::from) + .collect(); + if sequences.is_empty() { + None + } else { + Some(sequences) + } + } + _ => None, + } +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::serde_json::json; + + #[test] + fn test_parse_stop_sequences_single_string() { + let value = json!("stop"); + assert_eq!(parse_stop_sequences(&value), Some(vec!["stop".to_string()])); + } + + #[test] + fn test_parse_stop_sequences_array_of_strings() { + let value = json!(["stop1", "stop2"]); + assert_eq!( + parse_stop_sequences(&value), + Some(vec!["stop1".to_string(), "stop2".to_string()]) + ); + } + + #[test] + fn test_parse_stop_sequences_empty_array() { + let value = json!([]); + assert_eq!(parse_stop_sequences(&value), None); + } + + #[test] + fn test_parse_stop_sequences_array_with_non_strings() { + let value = json!([1, 2, 3]); + assert_eq!(parse_stop_sequences(&value), None); + } + + #[test] + fn test_parse_stop_sequences_mixed_array() { + let value = json!(["stop", 1, "end"]); + assert_eq!( + parse_stop_sequences(&value), + Some(vec!["stop".to_string(), "end".to_string()]) + ); + } + + #[test] + fn test_parse_stop_sequences_null() { + let value = json!(null); + assert_eq!(parse_stop_sequences(&value), None); + } + + #[test] + fn test_parse_stop_sequences_number() { + let value = json!(42); + assert_eq!(parse_stop_sequences(&value), None); + } + + #[test] + fn test_parse_stop_sequences_object() { + let value = json!({}); + assert_eq!(parse_stop_sequences(&value), None); + } + + #[test] + fn test_parse_stop_sequences_boolean() { + let value = json!(true); + assert_eq!(parse_stop_sequences(&value), None); + } +} diff --git a/crates/lingua/src/universal/response.rs b/crates/lingua/src/universal/response.rs index dc454883..a22a656d 100644 --- a/crates/lingua/src/universal/response.rs +++ b/crates/lingua/src/universal/response.rs @@ -5,12 +5,15 @@ This module provides a canonical representation of LLM responses that can be converted to/from any provider format. */ +use crate::capabilities::ProviderFormat; +use crate::serde_json::{self, Value}; use crate::universal::message::Message; +use serde::Serialize; /// Universal response envelope for LLM API responses. /// /// This type captures the common structure across all provider response formats. -#[derive(Debug, Clone)] +#[derive(Debug, Clone, Serialize)] pub struct UniversalResponse { /// Model that generated the response pub model: Option, @@ -47,7 +50,7 @@ pub struct UniversalUsage { /// Reason why the model stopped generating. /// /// Normalized across provider-specific values. 
-#[derive(Debug, Clone, PartialEq, Eq)] +#[derive(Debug, Clone, PartialEq, Eq, Serialize)] pub enum FinishReason { /// Normal completion (OpenAI: "stop", Anthropic: "end_turn", Google: "STOP") Stop, @@ -65,16 +68,303 @@ pub enum FinishReason { Other(String), } +impl std::fmt::Display for FinishReason { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + // Display as canonical (OpenAI) format strings + let s = match self { + Self::Stop => "stop", + Self::Length => "length", + Self::ToolCalls => "tool_calls", + Self::ContentFilter => "content_filter", + Self::Other(s) => s, + }; + write!(f, "{}", s) + } +} + impl std::str::FromStr for FinishReason { type Err = std::convert::Infallible; fn from_str(s: &str) -> Result { Ok(match s.to_lowercase().as_str() { "stop" | "end_turn" | "completed" => FinishReason::Stop, - "length" | "max_tokens" | "max_output_tokens" => FinishReason::Length, + "length" | "max_tokens" | "max_output_tokens" | "incomplete" => FinishReason::Length, "tool_calls" | "tool_use" => FinishReason::ToolCalls, - "content_filter" => FinishReason::ContentFilter, + "content_filter" | "content_filtered" | "safety" => FinishReason::ContentFilter, _ => FinishReason::Other(s.to_string()), }) } } + +impl FinishReason { + /// Parse a provider-specific finish reason string to universal FinishReason. + /// + /// This is the inverse of `to_provider_string()` and handles provider-specific + /// string variants: + /// - OpenAI Chat: "stop", "length", "tool_calls", "content_filter" + /// - OpenAI Responses: "completed", "incomplete" + /// - Anthropic: "end_turn", "stop_sequence", "max_tokens", "tool_use" + /// - Bedrock: "end_turn", "stop_sequence", "max_tokens", "tool_use", "content_filtered" + /// - Google: "STOP", "MAX_TOKENS", "TOOL_CALLS", "SAFETY", "RECITATION", "OTHER" + pub fn from_provider_string(s: &str, provider: ProviderFormat) -> Self { + match (s, provider) { + // Stop variants + ( + "end_turn" | "stop_sequence", + ProviderFormat::Anthropic | ProviderFormat::Converse, + ) => Self::Stop, + ("STOP", ProviderFormat::Google) => Self::Stop, + ("completed", ProviderFormat::Responses) => Self::Stop, + ("stop", _) => Self::Stop, + + // Length variants + ("max_tokens", ProviderFormat::Anthropic | ProviderFormat::Converse) => Self::Length, + ("MAX_TOKENS", ProviderFormat::Google) => Self::Length, + ("incomplete", ProviderFormat::Responses) => Self::Length, + ("length", _) => Self::Length, + + // ToolCalls variants + ("tool_use", ProviderFormat::Anthropic | ProviderFormat::Converse) => Self::ToolCalls, + ("TOOL_CALLS", ProviderFormat::Google) => Self::ToolCalls, + ("tool_calls", _) => Self::ToolCalls, + + // ContentFilter variants + ("content_filtered", ProviderFormat::Converse) => Self::ContentFilter, + ("SAFETY" | "RECITATION" | "OTHER", ProviderFormat::Google) => Self::ContentFilter, + ("content_filter", _) => Self::ContentFilter, + + // Unknown - pass through + (other, _) => Self::Other(other.to_string()), + } + } + + /// Convert a universal FinishReason to the provider-specific string representation. 
+ /// + /// Each provider uses different strings for finish reasons: + /// - OpenAI Chat: "stop", "length", "tool_calls", "content_filter" + /// - OpenAI Responses: "completed", "incomplete" + /// - Anthropic: "end_turn", "max_tokens", "tool_use" + /// - Bedrock: "end_turn", "max_tokens", "tool_use", "content_filtered" + /// - Google: "STOP", "MAX_TOKENS", "TOOL_CALLS", "SAFETY" + /// - Mistral: uses OpenAI format + pub fn to_provider_string(&self, provider: ProviderFormat) -> &str { + match (self, provider) { + // Stop variants + (Self::Stop, ProviderFormat::Anthropic | ProviderFormat::Converse) => "end_turn", + (Self::Stop, ProviderFormat::Google) => "STOP", + (Self::Stop, ProviderFormat::Responses) => "completed", + ( + Self::Stop, + ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown, + ) => "stop", + + // Length variants + ( + Self::Length, + ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown, + ) => "length", + (Self::Length, ProviderFormat::Responses) => "incomplete", + (Self::Length, ProviderFormat::Google) => "MAX_TOKENS", + (Self::Length, ProviderFormat::Anthropic | ProviderFormat::Converse) => "max_tokens", + + // ToolCalls variants + (Self::ToolCalls, ProviderFormat::Anthropic | ProviderFormat::Converse) => "tool_use", + (Self::ToolCalls, ProviderFormat::Google) => "TOOL_CALLS", + (Self::ToolCalls, ProviderFormat::Responses) => "completed", // Tool calls also complete + ( + Self::ToolCalls, + ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown, + ) => "tool_calls", + + // ContentFilter variants + (Self::ContentFilter, ProviderFormat::Converse) => "content_filtered", + (Self::ContentFilter, ProviderFormat::Google) => "SAFETY", + (Self::ContentFilter, ProviderFormat::Responses) => "incomplete", + ( + Self::ContentFilter, + ProviderFormat::OpenAI + | ProviderFormat::Anthropic + | ProviderFormat::Mistral + | ProviderFormat::Unknown, + ) => "content_filter", + + // Other - pass through as-is + (Self::Other(s), _) => s.as_str(), + } + } +} + +impl UniversalUsage { + /// Parse usage from provider-specific JSON value. 
+ /// + /// Different providers use different field names: + /// - OpenAI Chat: prompt_tokens, completion_tokens, prompt_tokens_details.cached_tokens + /// - OpenAI Responses: input_tokens, output_tokens, input_tokens_details.cached_tokens + /// - Anthropic: input_tokens, output_tokens, cache_read_input_tokens + /// - Bedrock: inputTokens, outputTokens, cacheReadInputTokens + /// - Google: promptTokenCount, candidatesTokenCount, cachedContentTokenCount + /// - Mistral: uses OpenAI format + pub fn from_provider_value(usage: &Value, provider: ProviderFormat) -> Self { + match provider { + // OpenAI, Mistral, and Unknown use OpenAI format + ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown => Self { + prompt_tokens: usage.get("prompt_tokens").and_then(Value::as_i64), + completion_tokens: usage.get("completion_tokens").and_then(Value::as_i64), + prompt_cached_tokens: usage + .get("prompt_tokens_details") + .and_then(|d| d.get("cached_tokens")) + .and_then(Value::as_i64), + prompt_cache_creation_tokens: None, // OpenAI doesn't report cache creation tokens + completion_reasoning_tokens: usage + .get("completion_tokens_details") + .and_then(|d| d.get("reasoning_tokens")) + .and_then(Value::as_i64), + }, + ProviderFormat::Responses => Self { + prompt_tokens: usage.get("input_tokens").and_then(Value::as_i64), + completion_tokens: usage.get("output_tokens").and_then(Value::as_i64), + prompt_cached_tokens: usage + .get("input_tokens_details") + .and_then(|d| d.get("cached_tokens")) + .and_then(Value::as_i64), + prompt_cache_creation_tokens: None, + completion_reasoning_tokens: usage + .get("output_tokens_details") + .and_then(|d| d.get("reasoning_tokens")) + .and_then(Value::as_i64), + }, + ProviderFormat::Anthropic => Self { + prompt_tokens: usage.get("input_tokens").and_then(Value::as_i64), + completion_tokens: usage.get("output_tokens").and_then(Value::as_i64), + prompt_cached_tokens: usage.get("cache_read_input_tokens").and_then(Value::as_i64), + prompt_cache_creation_tokens: usage + .get("cache_creation_input_tokens") + .and_then(Value::as_i64), + completion_reasoning_tokens: None, // Anthropic doesn't expose thinking tokens separately + }, + ProviderFormat::Converse => Self { + prompt_tokens: usage.get("inputTokens").and_then(Value::as_i64), + completion_tokens: usage.get("outputTokens").and_then(Value::as_i64), + prompt_cached_tokens: usage.get("cacheReadInputTokens").and_then(Value::as_i64), + prompt_cache_creation_tokens: usage + .get("cacheWriteInputTokens") + .and_then(Value::as_i64), + completion_reasoning_tokens: None, // Bedrock doesn't expose thinking tokens separately + }, + ProviderFormat::Google => Self { + prompt_tokens: usage.get("promptTokenCount").and_then(Value::as_i64), + completion_tokens: usage.get("candidatesTokenCount").and_then(Value::as_i64), + prompt_cached_tokens: usage.get("cachedContentTokenCount").and_then(Value::as_i64), + prompt_cache_creation_tokens: None, // Google doesn't report cache creation tokens + completion_reasoning_tokens: usage + .get("thoughtsTokenCount") + .and_then(Value::as_i64), + }, + } + } + + /// Extract usage from a response payload, handling provider-specific key names. + /// + /// Most providers use "usage", but Google uses "usageMetadata". 
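A minimal sketch of the usage field mapping listed above. The module paths (`crate::capabilities`, `crate::universal::response`) follow this patch's imports, and the wrapper function name is only for illustration: an Anthropic usage block is normalized into `UniversalUsage` and re-emitted with OpenAI Chat field names.

```rust
use crate::capabilities::ProviderFormat;
use crate::serde_json::json;
use crate::universal::response::UniversalUsage;

// Illustrative wrapper; not part of the patch.
fn usage_mapping_sketch() {
    // Anthropic-style usage block (field names per the mapping above).
    let anthropic_usage = json!({
        "input_tokens": 120,
        "output_tokens": 45,
        "cache_read_input_tokens": 80
    });

    let usage = UniversalUsage::from_provider_value(&anthropic_usage, ProviderFormat::Anthropic);
    assert_eq!(usage.prompt_tokens, Some(120));
    assert_eq!(usage.prompt_cached_tokens, Some(80));

    // Re-emit with OpenAI Chat field names; the total is derived from prompt + completion.
    let openai_usage = usage.to_provider_value(ProviderFormat::OpenAI);
    assert_eq!(openai_usage["prompt_tokens"].as_i64(), Some(120));
    assert_eq!(openai_usage["total_tokens"].as_i64(), Some(165));
    assert_eq!(
        openai_usage["prompt_tokens_details"]["cached_tokens"].as_i64(),
        Some(80)
    );
}
```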
+ pub fn extract_from_response(payload: &Value, provider: ProviderFormat) -> Option { + let key = match provider { + ProviderFormat::Google => "usageMetadata", + _ => "usage", + }; + payload + .get(key) + .map(|u| Self::from_provider_value(u, provider)) + } + + /// Convert to provider-specific JSON representation. + /// + /// Returns a JSON object with provider-specific field names. + pub fn to_provider_value(&self, provider: ProviderFormat) -> Value { + let prompt = self.prompt_tokens.unwrap_or(0); + let completion = self.completion_tokens.unwrap_or(0); + + match provider { + // OpenAI, Mistral, and Unknown use OpenAI format + ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown => { + let mut obj = serde_json::json!({ + "prompt_tokens": prompt, + "completion_tokens": completion, + "total_tokens": prompt + completion + }); + let obj_map = obj.as_object_mut().unwrap(); + + if let Some(cached_tokens) = self.prompt_cached_tokens { + obj_map.insert( + "prompt_tokens_details".into(), + serde_json::json!({ "cached_tokens": cached_tokens }), + ); + } + + if let Some(reasoning_tokens) = self.completion_reasoning_tokens { + obj_map.insert( + "completion_tokens_details".into(), + serde_json::json!({ "reasoning_tokens": reasoning_tokens }), + ); + } + + obj + } + ProviderFormat::Responses => { + let mut obj = serde_json::json!({ + "input_tokens": prompt, + "output_tokens": completion, + "total_tokens": prompt + completion + }); + let obj_map = obj.as_object_mut().unwrap(); + + if let Some(cached_tokens) = self.prompt_cached_tokens { + obj_map.insert( + "input_tokens_details".into(), + serde_json::json!({ "cached_tokens": cached_tokens }), + ); + } + + if let Some(reasoning_tokens) = self.completion_reasoning_tokens { + obj_map.insert( + "output_tokens_details".into(), + serde_json::json!({ "reasoning_tokens": reasoning_tokens }), + ); + } + + obj + } + ProviderFormat::Anthropic => { + let mut obj = serde_json::json!({ + "input_tokens": prompt, + "output_tokens": completion + }); + let obj_map = obj.as_object_mut().unwrap(); + + if let Some(cache_creation) = self.prompt_cache_creation_tokens { + obj_map.insert( + "cache_creation_input_tokens".into(), + serde_json::json!(cache_creation), + ); + } + + if let Some(cache_read) = self.prompt_cached_tokens { + obj_map.insert( + "cache_read_input_tokens".into(), + serde_json::json!(cache_read), + ); + } + + obj + } + ProviderFormat::Converse => serde_json::json!({ + "inputTokens": prompt, + "outputTokens": completion + }), + ProviderFormat::Google => serde_json::json!({ + "promptTokenCount": prompt, + "candidatesTokenCount": completion, + "totalTokenCount": prompt + completion + }), + } + } +} diff --git a/crates/lingua/src/universal/response_format.rs b/crates/lingua/src/universal/response_format.rs new file mode 100644 index 00000000..656a174a --- /dev/null +++ b/crates/lingua/src/universal/response_format.rs @@ -0,0 +1,429 @@ +/*! +Response format conversion utilities for cross-provider semantic translation. + +This module provides bidirectional conversion between different providers' +response format configurations: +- OpenAI Chat: `{ type: "text" | "json_object" | "json_schema", json_schema? }` +- OpenAI Responses: nested under `text.format` with flattened schema +- Google: `response_mime_type` + `response_schema` +- Anthropic: `{ type: "json_schema", schema, description? }` (no name/strict) + +## Design + +The conversion uses canonical fields (`format_type`, `json_schema`) for cross-provider +semantic translation. 
Same-provider round-trips are handled at a higher level via +passthrough optimization. + +## Usage + +```ignore +use std::convert::TryInto; +use crate::capabilities::ProviderFormat; +use crate::universal::request::ResponseFormatConfig; + +// FROM: Parse provider-specific value to universal config +let config: ResponseFormatConfig = (ProviderFormat::OpenAI, &raw_json).try_into()?; + +// TO: Convert universal config to provider-specific value +let output = config.to_provider(ProviderFormat::OpenAI)?; +``` +*/ + +use std::convert::TryFrom; + +use crate::capabilities::ProviderFormat; +use crate::error::ConvertError; +use crate::processing::transform::TransformError; +use crate::serde_json::{json, Map, Value}; +use crate::universal::request::{JsonSchemaConfig, ResponseFormatConfig, ResponseFormatType}; + +// ============================================================================= +// TryFrom Implementation for FROM Conversions +// ============================================================================= + +impl<'a> TryFrom<(ProviderFormat, &'a Value)> for ResponseFormatConfig { + type Error = TransformError; + + fn try_from((provider, value): (ProviderFormat, &'a Value)) -> Result { + match provider { + ProviderFormat::OpenAI => Ok(from_openai_chat(value)?), + ProviderFormat::Responses => Ok(from_openai_responses(value)?), + ProviderFormat::Anthropic => Ok(from_anthropic(value)?), + _ => Ok(Self::default()), + } + } +} + +// ============================================================================= +// to_provider Method for TO Conversions +// ============================================================================= + +impl ResponseFormatConfig { + /// Convert this config to a provider-specific value. + /// + /// # Arguments + /// * `provider` - Target provider format + /// + /// # Returns + /// `Ok(Some(value))` if conversion succeeded + /// `Ok(None)` if no value should be set + /// `Err(_)` if conversion failed + pub fn to_provider(&self, provider: ProviderFormat) -> Result, TransformError> { + match provider { + ProviderFormat::OpenAI => Ok(to_openai_chat(self)), + ProviderFormat::Responses => Ok(to_openai_responses_text(self)), + ProviderFormat::Anthropic => Ok(to_anthropic(self)), + _ => Ok(None), + } + } +} + +// ============================================================================= +// Private Helper Functions - FROM Provider Formats +// ============================================================================= + +/// Parse OpenAI Chat `response_format` into ResponseFormatConfig. +/// +/// Handles: +/// - `{ type: "text" }` +/// - `{ type: "json_object" }` +/// - `{ type: "json_schema", json_schema: { name, schema, strict?, description? 
} }` +fn from_openai_chat(value: &Value) -> Result { + let format_type = match value.get("type").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "ResponseFormatType", + value: s.to_string(), + })?), + None => None, + }; + + let json_schema = if format_type == Some(ResponseFormatType::JsonSchema) { + value.get("json_schema").and_then(|js| { + let name = js.get("name").and_then(Value::as_str)?; + let schema = js.get("schema").cloned()?; + Some(JsonSchemaConfig { + name: name.to_string(), + schema, + strict: js.get("strict").and_then(Value::as_bool), + description: js + .get("description") + .and_then(Value::as_str) + .map(String::from), + }) + }) + } else { + None + }; + + Ok(ResponseFormatConfig { + format_type, + json_schema, + }) +} + +/// Parse Anthropic `output_format` into ResponseFormatConfig. +/// +/// Handles: +/// - `{ type: "json_schema", schema: {...}, name?, strict?, description? }` +/// +/// Note: Anthropic's format is simpler - schema is directly at top level, +/// not nested under a `json_schema` key like OpenAI. +fn from_anthropic(value: &Value) -> Result { + let format_type = match value.get("type").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "ResponseFormatType", + value: s.to_string(), + })?), + None => None, + }; + + let json_schema = if format_type == Some(ResponseFormatType::JsonSchema) { + value.get("schema").cloned().map(|schema| JsonSchemaConfig { + name: value + .get("name") + .and_then(Value::as_str) + .map(String::from) + .unwrap_or_else(|| "response".to_string()), + schema, + strict: value.get("strict").and_then(Value::as_bool), + description: value + .get("description") + .and_then(Value::as_str) + .map(String::from), + }) + } else { + None + }; + + Ok(ResponseFormatConfig { + format_type, + json_schema, + }) +} + +/// Parse OpenAI Responses API `text.format` into ResponseFormatConfig. +/// +/// Handles the flattened structure: +/// - `{ type: "json_schema", name, schema, strict?, description? }` +fn from_openai_responses(value: &Value) -> Result { + let format_type = match value.get("type").and_then(Value::as_str) { + Some(s) => Some(s.parse().map_err(|_| ConvertError::InvalidEnumValue { + type_name: "ResponseFormatType", + value: s.to_string(), + })?), + None => None, + }; + + let json_schema = if format_type == Some(ResponseFormatType::JsonSchema) { + value.get("name").and_then(Value::as_str).and_then(|name| { + value.get("schema").cloned().map(|schema| JsonSchemaConfig { + name: name.to_string(), + schema, + strict: value.get("strict").and_then(Value::as_bool), + description: value + .get("description") + .and_then(Value::as_str) + .map(String::from), + }) + }) + } else { + None + }; + + Ok(ResponseFormatConfig { + format_type, + json_schema, + }) +} + +// ============================================================================= +// Private Helper Functions - TO Provider Formats +// ============================================================================= + +/// Convert ResponseFormatConfig to OpenAI Chat `response_format` value. +/// +/// Output format: +/// - `{ type: "text" }` +/// - `{ type: "json_object" }` +/// - `{ type: "json_schema", json_schema: { name, schema, strict?, description? 
} }` +fn to_openai_chat(config: &ResponseFormatConfig) -> Option { + let format_type = config.format_type?; + + match format_type { + ResponseFormatType::Text => Some(json!({ "type": "text" })), + ResponseFormatType::JsonObject => Some(json!({ "type": "json_object" })), + ResponseFormatType::JsonSchema => { + let js = config.json_schema.as_ref()?; + let mut json_schema = Map::new(); + json_schema.insert("name".into(), Value::String(js.name.clone())); + json_schema.insert("schema".into(), js.schema.clone()); + if let Some(strict) = js.strict { + json_schema.insert("strict".into(), Value::Bool(strict)); + } + if let Some(ref desc) = js.description { + json_schema.insert("description".into(), Value::String(desc.clone())); + } + Some(json!({ + "type": "json_schema", + "json_schema": json_schema + })) + } + } +} + +/// Convert ResponseFormatConfig to OpenAI Responses API `text` object. +/// +/// Output format (flattened, wrapped in text object): +/// - `{ format: { type: "text" } }` +/// - `{ format: { type: "json_schema", name, schema, strict?, description? } }` +/// +/// Returns the full `text` object, not just the format. +fn to_openai_responses_text(config: &ResponseFormatConfig) -> Option { + let format_type = config.format_type?; + + let format_obj = match format_type { + ResponseFormatType::Text => json!({ "type": "text" }), + ResponseFormatType::JsonObject => json!({ "type": "json_object" }), + ResponseFormatType::JsonSchema => { + let js = config.json_schema.as_ref()?; + let mut obj = Map::new(); + obj.insert("type".into(), Value::String("json_schema".into())); + obj.insert("name".into(), Value::String(js.name.clone())); + obj.insert("schema".into(), js.schema.clone()); + if let Some(strict) = js.strict { + obj.insert("strict".into(), Value::Bool(strict)); + } + if let Some(ref desc) = js.description { + obj.insert("description".into(), Value::String(desc.clone())); + } + Value::Object(obj) + } + }; + + Some(json!({ "format": format_obj })) +} + +/// Convert ResponseFormatConfig to Anthropic `output_format` value. +/// +/// Output format: +/// - `{ type: "json_schema", schema: {...}, description? }` +/// +/// Note: Anthropic rejects `name` and `strict` fields with a 400 error. +/// Returns `None` for Text type. JsonObject is converted to json_schema with generic schema. 
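A quick sketch of the `json_object` fallback and `Text` behaviour described above, assuming the `ResponseFormatConfig`/`ResponseFormatType` paths added to `universal::request` in this patch (the wrapper function is illustrative only).

```rust
use crate::capabilities::ProviderFormat;
use crate::serde_json::json;
use crate::universal::request::{ResponseFormatConfig, ResponseFormatType};

// Illustrative wrapper; not part of the patch.
fn json_object_to_anthropic_sketch() {
    let config = ResponseFormatConfig {
        format_type: Some(ResponseFormatType::JsonObject),
        json_schema: None,
    };

    // Anthropic has no plain "json_object" mode, so it becomes a generic
    // json_schema with additionalProperties: false.
    let anthropic = config
        .to_provider(ProviderFormat::Anthropic)
        .unwrap()
        .unwrap();
    assert_eq!(
        anthropic,
        json!({
            "type": "json_schema",
            "schema": { "type": "object", "additionalProperties": false }
        })
    );

    // Plain text output has no Anthropic structured-output equivalent and emits nothing.
    let text_only = ResponseFormatConfig {
        format_type: Some(ResponseFormatType::Text),
        json_schema: None,
    };
    assert!(text_only
        .to_provider(ProviderFormat::Anthropic)
        .unwrap()
        .is_none());
}
```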
+fn to_anthropic(config: &ResponseFormatConfig) -> Option { + let format_type = config.format_type?; + + match format_type { + // Anthropic doesn't support text format for structured outputs + ResponseFormatType::Text => None, + // json_object is converted to json_schema with generic { type: "object" } schema + // Anthropic requires additionalProperties: false in the schema + ResponseFormatType::JsonObject => Some(json!({ + "type": "json_schema", + "schema": { "type": "object", "additionalProperties": false } + })), + ResponseFormatType::JsonSchema => { + let js = config.json_schema.as_ref()?; + let mut obj = Map::new(); + obj.insert("type".into(), Value::String("json_schema".into())); + obj.insert("schema".into(), js.schema.clone()); + // Note: Anthropic doesn't support "name" or "strict" fields - it returns 400 if present + if let Some(ref desc) = js.description { + obj.insert("description".into(), Value::String(desc.clone())); + } + Some(Value::Object(obj)) + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + use std::convert::TryInto; + + #[test] + fn test_from_openai_chat_text() { + let value = json!({ "type": "text" }); + let config: ResponseFormatConfig = (ProviderFormat::OpenAI, &value).try_into().unwrap(); + assert_eq!(config.format_type, Some(ResponseFormatType::Text)); + assert!(config.json_schema.is_none()); + } + + #[test] + fn test_from_openai_chat_json_schema() { + let value = json!({ + "type": "json_schema", + "json_schema": { + "name": "person_info", + "schema": { + "type": "object", + "properties": { + "name": { "type": "string" } + } + }, + "strict": true + } + }); + let config: ResponseFormatConfig = (ProviderFormat::OpenAI, &value).try_into().unwrap(); + assert_eq!(config.format_type, Some(ResponseFormatType::JsonSchema)); + let js = config.json_schema.unwrap(); + assert_eq!(js.name, "person_info"); + assert_eq!(js.strict, Some(true)); + } + + #[test] + fn test_to_openai_chat_json_schema() { + let config = ResponseFormatConfig { + format_type: Some(ResponseFormatType::JsonSchema), + json_schema: Some(JsonSchemaConfig { + name: "test_schema".into(), + schema: json!({ "type": "object" }), + strict: Some(true), + description: None, + }), + }; + let value = config.to_provider(ProviderFormat::OpenAI).unwrap().unwrap(); + assert_eq!(value.get("type").unwrap(), "json_schema"); + assert!(value.get("json_schema").is_some()); + assert_eq!( + value + .get("json_schema") + .unwrap() + .get("name") + .unwrap() + .as_str() + .unwrap(), + "test_schema" + ); + } + + #[test] + fn test_roundtrip_openai_chat() { + let original = json!({ + "type": "json_schema", + "json_schema": { + "name": "test", + "schema": { "type": "object" }, + "strict": true + } + }); + let config: ResponseFormatConfig = (ProviderFormat::OpenAI, &original).try_into().unwrap(); + let back = config.to_provider(ProviderFormat::OpenAI).unwrap().unwrap(); + assert_eq!(original, back); + } + + #[test] + fn test_to_responses_text_format() { + let config = ResponseFormatConfig { + format_type: Some(ResponseFormatType::JsonSchema), + json_schema: Some(JsonSchemaConfig { + name: "test".into(), + schema: json!({ "type": "object" }), + strict: Some(true), + description: None, + }), + }; + let value = config + .to_provider(ProviderFormat::Responses) + .unwrap() + .unwrap(); + let format = value.get("format").unwrap(); + assert_eq!(format.get("type").unwrap(), "json_schema"); + assert_eq!(format.get("name").unwrap(), "test"); + } + + #[test] + fn test_cross_provider_openai_to_anthropic() { + // Parse OpenAI format + let 
openai_format = json!({ + "type": "json_schema", + "json_schema": { + "name": "person_info", + "schema": { + "type": "object", + "properties": { + "name": { "type": "string" } + } + }, + "strict": true + } + }); + let config: ResponseFormatConfig = + (ProviderFormat::OpenAI, &openai_format).try_into().unwrap(); + + // Convert to Anthropic format + let anthropic_format = config + .to_provider(ProviderFormat::Anthropic) + .unwrap() + .unwrap(); + + // Verify Anthropic format structure + assert_eq!(anthropic_format.get("type").unwrap(), "json_schema"); + // Name and strict are NOT included because Anthropic doesn't support them + assert!(anthropic_format.get("name").is_none()); + assert!(anthropic_format.get("strict").is_none()); + assert!(anthropic_format.get("schema").is_some()); + // Anthropic format doesn't have nested json_schema wrapper + assert!(anthropic_format.get("json_schema").is_none()); + } +} diff --git a/crates/lingua/src/universal/tool_choice.rs b/crates/lingua/src/universal/tool_choice.rs new file mode 100644 index 00000000..1895339a --- /dev/null +++ b/crates/lingua/src/universal/tool_choice.rs @@ -0,0 +1,447 @@ +/*! +Tool choice conversion utilities for cross-provider semantic translation. + +This module provides bidirectional conversion between different providers' +tool choice configurations: +- OpenAI Chat: `"auto"` | `"none"` | `"required"` | `{ type: "function", function: { name } }` +- OpenAI Responses: `"auto"` | `{ type: "function", name }` +- Anthropic: `{ type: "auto" | "any" | "none" | "tool", name?, disable_parallel_tool_use? }` + +## Design + +Uses canonical fields (`mode`, `tool_name`) for cross-provider conversion. + +## Usage + +```ignore +use std::convert::TryInto; +use crate::capabilities::ProviderFormat; +use crate::universal::request::ToolChoiceConfig; + +// FROM: Parse provider-specific value to universal config +let config: ToolChoiceConfig = (ProviderFormat::Anthropic, &raw_json).try_into()?; + +// TO: Convert universal config to provider-specific value +// parallel_tool_calls: Some(false) disables parallel calls; None uses config.disable_parallel +let output = config.to_provider(ProviderFormat::Anthropic, Some(false))?; +``` +*/ + +use std::convert::TryFrom; + +use crate::capabilities::ProviderFormat; +use crate::processing::transform::TransformError; +use crate::serde_json::{json, Map, Value}; +use crate::universal::request::{ToolChoiceConfig, ToolChoiceMode}; + +// ============================================================================= +// TryFrom Implementation for FROM Conversions +// ============================================================================= + +impl<'a> TryFrom<(ProviderFormat, &'a Value)> for ToolChoiceConfig { + type Error = TransformError; + + fn try_from((provider, value): (ProviderFormat, &'a Value)) -> Result { + match provider { + ProviderFormat::OpenAI => from_openai_chat(value), + ProviderFormat::Responses => from_openai_responses(value), + ProviderFormat::Anthropic => from_anthropic(value), + _ => Ok(Self::default()), + } + } +} + +// ============================================================================= +// to_provider Method for TO Conversions +// ============================================================================= + +impl ToolChoiceConfig { + /// Convert this config to a provider-specific value. 
+ /// + /// # Arguments + /// * `provider` - Target provider format + /// * `parallel_tool_calls` - Whether parallel tool calls are enabled (for Anthropic's disable_parallel_tool_use) + /// + /// # Returns + /// `Ok(Some(value))` if conversion succeeded + /// `Ok(None)` if no value should be set (e.g., mode is None) + /// `Err(_)` if conversion failed + pub fn to_provider( + &self, + provider: ProviderFormat, + parallel_tool_calls: Option, + ) -> Result, TransformError> { + match provider { + ProviderFormat::OpenAI => Ok(to_openai_chat(self)), + ProviderFormat::Responses => Ok(to_openai_responses(self)), + ProviderFormat::Anthropic => Ok(to_anthropic(self, parallel_tool_calls)), + _ => Ok(None), + } + } +} + +// ============================================================================= +// Private Helper Functions - FROM Provider Formats +// ============================================================================= + +/// Parse OpenAI Chat `tool_choice` into ToolChoiceConfig. +/// +/// Handles: +/// - String: `"auto"`, `"none"`, `"required"` +/// - Object: `{ type: "function", function: { name: "..." } }` +fn from_openai_chat(value: &Value) -> Result { + match value { + Value::String(s) => { + let mode = s + .parse() + .map_err(|e| TransformError::ToUniversalFailed(format!("{}", e)))?; + Ok(ToolChoiceConfig { + mode: Some(mode), + tool_name: None, + disable_parallel: None, + }) + } + Value::Object(obj) => { + // OpenAI Chat uses { type: "function", function: { name: "..." } } + let type_str = obj.get("type").and_then(Value::as_str); + match type_str { + Some("function") | None => {} + Some(other) => { + return Err(TransformError::ToUniversalFailed(format!( + "unrecognized tool_choice type: '{}'", + other + ))) + } + } + + let tool_name = obj + .get("function") + .and_then(|f| f.get("name")) + .and_then(Value::as_str) + .map(String::from); + + Ok(ToolChoiceConfig { + mode: Some(ToolChoiceMode::Tool), + tool_name, + disable_parallel: None, + }) + } + _ => Ok(ToolChoiceConfig::default()), + } +} + +/// Parse OpenAI Responses API `tool_choice` into ToolChoiceConfig. +/// +/// Handles: +/// - String: `"auto"`, `"none"`, `"required"` +/// - Object: `{ type: "function", name: "..." }` (flatter than Chat) +fn from_openai_responses(value: &Value) -> Result { + match value { + Value::String(s) => { + let mode = s + .parse() + .map_err(|e| TransformError::ToUniversalFailed(format!("{}", e)))?; + Ok(ToolChoiceConfig { + mode: Some(mode), + tool_name: None, + disable_parallel: None, + }) + } + Value::Object(obj) => { + let tool_name = obj.get("name").and_then(Value::as_str).map(String::from); + + // OpenAI Responses uses { type: "function", name: "..." } + let type_str = obj.get("type").and_then(Value::as_str); + let mode = match type_str { + Some("function") | None => Some(ToolChoiceMode::Tool), + Some(other) => { + return Err(TransformError::ToUniversalFailed(format!( + "unrecognized tool_choice type: '{}'", + other + ))) + } + }; + + Ok(ToolChoiceConfig { + mode, + tool_name, + disable_parallel: None, + }) + } + _ => Ok(ToolChoiceConfig::default()), + } +} + +/// Parse Anthropic `tool_choice` into ToolChoiceConfig. +/// +/// Handles: +/// - `{ type: "auto" }` +/// - `{ type: "any" }` +/// - `{ type: "none" }` +/// - `{ type: "tool", name: "..." 
}` +/// - `{ ..., disable_parallel_tool_use: true }` +fn from_anthropic(value: &Value) -> Result { + let obj = match value.as_object() { + Some(o) => o, + None => return Ok(ToolChoiceConfig::default()), + }; + + let mode = match obj.get("type").and_then(Value::as_str) { + Some(s) => Some( + s.parse() + .map_err(|e| TransformError::ToUniversalFailed(format!("{}", e)))?, + ), + None => None, + }; + + let tool_name = obj.get("name").and_then(Value::as_str).map(String::from); + + let disable_parallel = obj + .get("disable_parallel_tool_use") + .and_then(Value::as_bool); + + Ok(ToolChoiceConfig { + mode, + tool_name, + disable_parallel, + }) +} + +// ============================================================================= +// Private Helper Functions - TO Provider Formats +// ============================================================================= + +/// Convert ToolChoiceConfig to OpenAI Chat `tool_choice` value. +/// +/// Output format: +/// - `"auto"`, `"none"`, `"required"` for simple modes +/// - `{ type: "function", function: { name: "..." } }` for specific tool +fn to_openai_chat(config: &ToolChoiceConfig) -> Option { + let mode = config.mode?; + + match mode { + ToolChoiceMode::Auto => Some(Value::String("auto".into())), + ToolChoiceMode::None => Some(Value::String("none".into())), + ToolChoiceMode::Required => Some(Value::String("required".into())), + ToolChoiceMode::Tool => { + let name = config.tool_name.as_ref()?; + Some(json!({ + "type": "function", + "function": { + "name": name + } + })) + } + } +} + +/// Convert ToolChoiceConfig to OpenAI Responses API `tool_choice` value. +/// +/// Output format: +/// - `"auto"`, `"none"`, `"required"` for simple modes +/// - `{ type: "function", name: "..." }` for specific tool (flatter than Chat) +fn to_openai_responses(config: &ToolChoiceConfig) -> Option { + let mode = config.mode?; + + match mode { + ToolChoiceMode::Auto => Some(Value::String("auto".into())), + ToolChoiceMode::None => Some(Value::String("none".into())), + ToolChoiceMode::Required => Some(Value::String("required".into())), + ToolChoiceMode::Tool => { + let name = config.tool_name.as_ref()?; + Some(json!({ + "type": "function", + "name": name + })) + } + } +} + +/// Convert ToolChoiceConfig to Anthropic `tool_choice` value. +/// +/// Output format: +/// - `{ type: "auto" }`, `{ type: "any" }`, `{ type: "none" }` +/// - `{ type: "tool", name: "..." 
}` +/// - Includes `disable_parallel_tool_use` if set +fn to_anthropic(config: &ToolChoiceConfig, parallel_tool_calls: Option) -> Option { + // If parallel_tool_calls is explicitly false, we MUST emit tool_choice with disable_parallel_tool_use + let needs_disable_parallel = + parallel_tool_calls == Some(false) || config.disable_parallel == Some(true); + + // Get mode, defaulting to Auto if we need to disable parallel (so we can emit the field) + let mode = match config.mode { + Some(m) => m, + None if needs_disable_parallel => ToolChoiceMode::Auto, + None => return None, + }; + + let mut obj = Map::new(); + obj.insert("type".into(), Value::String(mode.as_anthropic_str().into())); + + if mode == ToolChoiceMode::Tool { + if let Some(ref name) = config.tool_name { + obj.insert("name".into(), Value::String(name.clone())); + } + } + + if needs_disable_parallel { + obj.insert("disable_parallel_tool_use".into(), Value::Bool(true)); + } + + Some(Value::Object(obj)) +} + +#[cfg(test)] +mod tests { + use super::*; + use std::convert::TryInto; + + #[test] + fn test_from_openai_chat_string() { + let value = json!("auto"); + let config: ToolChoiceConfig = (ProviderFormat::OpenAI, &value).try_into().unwrap(); + assert_eq!(config.mode, Some(ToolChoiceMode::Auto)); + assert_eq!(config.tool_name, None); + } + + #[test] + fn test_from_openai_chat_function() { + let value = json!({ + "type": "function", + "function": { "name": "get_weather" } + }); + let config: ToolChoiceConfig = (ProviderFormat::OpenAI, &value).try_into().unwrap(); + assert_eq!(config.mode, Some(ToolChoiceMode::Tool)); + assert_eq!(config.tool_name, Some("get_weather".into())); + } + + #[test] + fn test_from_anthropic_tool() { + let value = json!({ + "type": "tool", + "name": "get_weather" + }); + let config: ToolChoiceConfig = (ProviderFormat::Anthropic, &value).try_into().unwrap(); + assert_eq!(config.mode, Some(ToolChoiceMode::Tool)); + assert_eq!(config.tool_name, Some("get_weather".into())); + } + + #[test] + fn test_from_anthropic_with_disable_parallel() { + let value = json!({ + "type": "auto", + "disable_parallel_tool_use": true + }); + let config: ToolChoiceConfig = (ProviderFormat::Anthropic, &value).try_into().unwrap(); + assert_eq!(config.mode, Some(ToolChoiceMode::Auto)); + assert_eq!(config.disable_parallel, Some(true)); + } + + #[test] + fn test_to_openai_chat_auto() { + let config = ToolChoiceConfig { + mode: Some(ToolChoiceMode::Auto), + ..Default::default() + }; + let value = config + .to_provider(ProviderFormat::OpenAI, None) + .unwrap() + .unwrap(); + assert_eq!(value, json!("auto")); + } + + #[test] + fn test_to_openai_chat_function() { + let config = ToolChoiceConfig { + mode: Some(ToolChoiceMode::Tool), + tool_name: Some("get_weather".into()), + ..Default::default() + }; + let value = config + .to_provider(ProviderFormat::OpenAI, None) + .unwrap() + .unwrap(); + assert_eq!( + value, + json!({ + "type": "function", + "function": { "name": "get_weather" } + }) + ); + } + + #[test] + fn test_to_anthropic_any() { + let config = ToolChoiceConfig { + mode: Some(ToolChoiceMode::Required), + ..Default::default() + }; + let value = config + .to_provider(ProviderFormat::Anthropic, None) + .unwrap() + .unwrap(); + assert_eq!(value.get("type").unwrap(), "any"); + } + + #[test] + fn test_to_anthropic_with_parallel_disabled() { + let config = ToolChoiceConfig { + mode: Some(ToolChoiceMode::Auto), + ..Default::default() + }; + // parallel_tool_calls: false → disable_parallel_tool_use: true + let value = config + 
.to_provider(ProviderFormat::Anthropic, Some(false)) + .unwrap() + .unwrap(); + assert_eq!(value.get("type").unwrap(), "auto"); + assert_eq!(value.get("disable_parallel_tool_use").unwrap(), true); + } + + #[test] + fn test_roundtrip_openai_chat() { + let original = json!({ + "type": "function", + "function": { "name": "get_weather" } + }); + let config: ToolChoiceConfig = (ProviderFormat::OpenAI, &original).try_into().unwrap(); + let back = config + .to_provider(ProviderFormat::OpenAI, None) + .unwrap() + .unwrap(); + assert_eq!(original, back); + } + + #[test] + fn test_cross_provider_openai_to_anthropic() { + // OpenAI required → Anthropic any + let openai_value = json!("required"); + let config: ToolChoiceConfig = (ProviderFormat::OpenAI, &openai_value).try_into().unwrap(); + let anthropic_value = config + .to_provider(ProviderFormat::Anthropic, None) + .unwrap() + .unwrap(); + assert_eq!(anthropic_value.get("type").unwrap(), "any"); + } + + #[test] + fn test_invalid_string_mode_errors() { + // Unrecognized string mode should error + let value = json!("invalid_mode"); + let result: Result = (ProviderFormat::OpenAI, &value).try_into(); + assert!(result.is_err()); + assert!(result.unwrap_err().to_string().contains("invalid_mode")); + } + + #[test] + fn test_invalid_object_type_errors() { + // Unrecognized type in object should error + let value = json!({ + "type": "unknown_type", + "name": "some_tool" + }); + let result: Result = (ProviderFormat::Responses, &value).try_into(); + assert!(result.is_err()); + assert!(result.unwrap_err().to_string().contains("unknown_type")); + } +} diff --git a/crates/lingua/src/universal/tools.rs b/crates/lingua/src/universal/tools.rs new file mode 100644 index 00000000..2a7a3e4e --- /dev/null +++ b/crates/lingua/src/universal/tools.rs @@ -0,0 +1,873 @@ +/*! +Tool format conversion utilities for cross-provider semantic translation. + +This module provides bidirectional conversion between different providers' +tool formats: +- Anthropic: `{"name": "...", "description": "...", "input_schema": {...}}` +- OpenAI: `{"type": "function", "function": {"name": "...", "description": "...", "parameters": {...}}}` + +## Design + +Tools are a complex case because different providers have fundamentally different +structures. Unlike simple fields like `stop` or `tool_choice`, tools require +structural transformation rather than just field renaming. + +Anthropic built-in tools (bash, text_editor, web_search) have a "type" field +at the root level, but custom tools do not. OpenAI always requires "type": "function" +with the tool definition nested under "function". + +## UniversalTool + +The `UniversalTool` type provides a typed representation that can convert to/from +any provider format. It distinguishes between: +- Function tools (user-defined, work across all providers) +- Builtin tools (provider-specific, may not translate) +*/ + +use serde::{Deserialize, Serialize}; + +use crate::error::ConvertError; +use crate::serde_json::{json, Map, Value}; + +// ============================================================================= +// Universal Tool Types +// ============================================================================= + +/// A tool definition in universal format. +/// +/// This provides a typed representation that normalizes the different tool formats +/// across providers (Anthropic, OpenAI Chat, OpenAI Responses API, etc.). 
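The sibling modules (`response_format`, `tool_choice`) carry a short usage sketch in their docs; here is an equivalent one for the `UniversalTool` type defined just below. It is illustrative only (the module path `crate::universal::tools` and the wrapper function are assumptions): one function tool converts to all three provider shapes.

```rust
use crate::serde_json::json;
use crate::universal::tools::UniversalTool;

// Illustrative wrapper; not part of the patch.
fn tool_conversion_sketch() {
    let tool = UniversalTool::function(
        "get_weather",
        Some("Get the weather".to_string()),
        Some(json!({ "type": "object" })),
    );

    // Same tool, three provider shapes.
    let anthropic = tool.to_anthropic_value().unwrap(); // { name, description, input_schema }
    let openai = tool.to_openai_chat_value().unwrap(); // { type: "function", function: {...} }
    let responses = tool.to_responses_value().unwrap(); // { type: "function", name, ..., strict: false }

    assert!(anthropic.get("type").is_none());
    assert_eq!(openai["function"]["name"], "get_weather");
    assert_eq!(responses["strict"], false);
}
```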
+#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
+pub struct UniversalTool {
+    /// Tool name (required for all tool types)
+    pub name: String,
+
+    /// Tool description
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub description: Option<String>,
+
+    /// Parameters/input schema (JSON Schema)
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub parameters: Option<Value>,
+
+    /// Tool type classification
+    #[serde(flatten)]
+    pub tool_type: UniversalToolType,
+}
+
+/// Classification of tool types.
+#[derive(Debug, Clone, Default, PartialEq, Serialize, Deserialize)]
+#[serde(tag = "kind")]
+pub enum UniversalToolType {
+    /// User-defined function tool (works across all providers)
+    #[default]
+    #[serde(rename = "function")]
+    Function,
+
+    /// Provider-specific built-in tool (may not translate to other providers)
+    #[serde(rename = "builtin")]
+    Builtin {
+        /// Provider identifier (e.g., "anthropic", "openai_responses")
+        provider: String,
+        /// Original type name (e.g., "bash_20250124", "code_interpreter")
+        builtin_type: String,
+        /// Provider-specific configuration
+        #[serde(skip_serializing_if = "Option::is_none")]
+        config: Option<Value>,
+    },
+}
+
+// =============================================================================
+// UniversalTool Constructors
+// =============================================================================
+
+impl UniversalTool {
+    /// Create a new function tool.
+    pub fn function(
+        name: impl Into<String>,
+        description: Option<String>,
+        parameters: Option<Value>,
+    ) -> Self {
+        Self {
+            name: name.into(),
+            description,
+            parameters,
+            tool_type: UniversalToolType::Function,
+        }
+    }
+
+    /// Create a new builtin tool.
+    pub fn builtin(
+        name: impl Into<String>,
+        provider: impl Into<String>,
+        builtin_type: impl Into<String>,
+        config: Option<Value>,
+    ) -> Self {
+        Self {
+            name: name.into(),
+            description: None,
+            parameters: None,
+            tool_type: UniversalToolType::Builtin {
+                provider: provider.into(),
+                builtin_type: builtin_type.into(),
+                config,
+            },
+        }
+    }
+
+    /// Check if this is a function tool.
+    pub fn is_function(&self) -> bool {
+        matches!(self.tool_type, UniversalToolType::Function)
+    }
+
+    /// Check if this is a builtin tool.
+    pub fn is_builtin(&self) -> bool {
+        matches!(self.tool_type, UniversalToolType::Builtin { .. })
+    }
+
+    /// Get the builtin provider, if this is a builtin tool.
+    pub fn builtin_provider(&self) -> Option<&str> {
+        match &self.tool_type {
+            UniversalToolType::Builtin { provider, .. } => Some(provider),
+            _ => None,
+        }
+    }
+}
+
+// =============================================================================
+// Conversion from Provider Formats
+// =============================================================================
+
+impl UniversalTool {
+    /// Parse a tool from Anthropic format (JSON Value).
+    ///
+    /// Handles both custom tools and built-in tools (bash, text_editor, web_search).
+ pub fn from_anthropic_value(value: &Value) -> Option { + // Check for built-in tools first (have "type" field) + if let Some(tool_type) = value.get("type").and_then(Value::as_str) { + let name = value + .get("name") + .and_then(Value::as_str) + .unwrap_or(tool_type) + .to_string(); + + // Determine builtin type from the type field + if tool_type.starts_with("bash_") + || tool_type.starts_with("text_editor_") + || tool_type.starts_with("web_search_") + { + return Some(Self::builtin( + name, + "anthropic", + tool_type, + Some(value.clone()), + )); + } + } + + // Custom tool format: {"name", "description", "input_schema"} + let name = value.get("name").and_then(Value::as_str)?; + let description = value + .get("description") + .and_then(Value::as_str) + .map(String::from); + let parameters = value.get("input_schema").cloned(); + + Some(Self::function(name, description, parameters)) + } + + /// Parse a tool from OpenAI Chat Completions format (JSON Value). + /// + /// Format: `{"type": "function", "function": {"name", "description", "parameters"}}` + pub fn from_openai_chat_value(value: &Value) -> Option { + // OpenAI Chat format requires type: "function" and nested function object + if value.get("type").and_then(Value::as_str) != Some("function") { + return None; + } + + let func = value.get("function")?; + let name = func.get("name").and_then(Value::as_str)?; + let description = func + .get("description") + .and_then(Value::as_str) + .map(String::from); + let parameters = func.get("parameters").cloned(); + + Some(Self::function(name, description, parameters)) + } + + /// Parse a tool from OpenAI Responses API format (JSON Value). + /// + /// Function format: `{"type": "function", "name", "description", "parameters", "strict"}` + /// Builtin format: `{"type": "code_interpreter"}`, `{"type": "web_search_preview"}`, etc. + pub fn from_responses_value(value: &Value) -> Option { + let tool_type = value.get("type").and_then(Value::as_str)?; + + match tool_type { + "function" => { + // Responses API function: name is at top level, not nested + let name = value.get("name").and_then(Value::as_str)?; + let description = value + .get("description") + .and_then(Value::as_str) + .map(String::from); + let parameters = value.get("parameters").cloned(); + + Some(Self::function(name, description, parameters)) + } + "code_interpreter" + | "web_search_preview" + | "mcp" + | "file_search" + | "computer_use_preview" => { + // Responses API built-in tools + Some(Self::builtin( + tool_type, + "openai_responses", + tool_type, + Some(value.clone()), + )) + } + _ => None, + } + } + + /// Parse tools from a JSON Value array, auto-detecting the format. 
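A sketch of the auto-detection this method documents, assuming the `crate::universal::tools` path and an illustrative wrapper function: an OpenAI Chat array and an Anthropic array are recognized by shape and parsed into the same universal representation.

```rust
use crate::serde_json::json;
use crate::universal::tools::UniversalTool;

// Illustrative wrapper; not part of the patch.
fn auto_detect_sketch() {
    let openai_tools = json!([{
        "type": "function",
        "function": { "name": "get_weather", "parameters": { "type": "object" } }
    }]);
    let anthropic_tools = json!([{
        "name": "get_weather",
        "input_schema": { "type": "object" }
    }]);

    // Both arrays are detected by shape and parsed into the same representation.
    let a = UniversalTool::from_value_array(&openai_tools);
    let b = UniversalTool::from_value_array(&anthropic_tools);
    assert_eq!(a.len(), 1);
    assert_eq!(a[0].name, b[0].name);
    assert!(a[0].is_function() && b[0].is_function());
}
```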
+ pub fn from_value_array(tools: &Value) -> Vec { + let Some(arr) = tools.as_array() else { + return Vec::new(); + }; + + let format = detect_tools_format(tools); + + arr.iter() + .filter_map(|tool| match format { + ToolsFormat::OpenAIChat => Self::from_openai_chat_value(tool), + ToolsFormat::OpenAIResponses => Self::from_responses_value(tool), + ToolsFormat::AnthropicCustom | ToolsFormat::AnthropicBuiltin => { + Self::from_anthropic_value(tool) + } + ToolsFormat::Unknown => { + // Try each format in order + Self::from_openai_chat_value(tool) + .or_else(|| Self::from_responses_value(tool)) + .or_else(|| Self::from_anthropic_value(tool)) + } + }) + .collect() + } +} + +// ============================================================================= +// Conversion to Provider Formats +// ============================================================================= + +impl UniversalTool { + /// Convert to Anthropic format (JSON Value). + /// + /// Returns an error if the tool is a builtin from a different provider. + pub fn to_anthropic_value(&self) -> Result { + match &self.tool_type { + UniversalToolType::Function => { + let mut obj = Map::new(); + obj.insert("name".into(), Value::String(self.name.clone())); + + if let Some(desc) = &self.description { + obj.insert("description".into(), Value::String(desc.clone())); + } + + obj.insert( + "input_schema".into(), + self.parameters.clone().unwrap_or_else(|| json!({})), + ); + + Ok(Value::Object(obj)) + } + UniversalToolType::Builtin { + provider, + builtin_type, + config, + } => { + if provider != "anthropic" { + return Err(ConvertError::UnsupportedToolType { + tool_name: self.name.clone(), + tool_type: builtin_type.clone(), + target_provider: "Anthropic".to_string(), + }); + } + // Return the original config for Anthropic builtins + config + .clone() + .ok_or_else(|| ConvertError::MissingRequiredField { + field: format!("config for Anthropic builtin tool '{}'", self.name), + }) + } + } + } + + /// Convert to OpenAI Chat Completions format (JSON Value). + /// + /// Returns an error if the tool is a builtin (Chat Completions doesn't support builtins). + pub fn to_openai_chat_value(&self) -> Result { + match &self.tool_type { + UniversalToolType::Function => { + let mut func = Map::new(); + func.insert("name".into(), Value::String(self.name.clone())); + + if let Some(desc) = &self.description { + func.insert("description".into(), Value::String(desc.clone())); + } + + func.insert( + "parameters".into(), + self.parameters.clone().unwrap_or_else(|| json!({})), + ); + + Ok(json!({ + "type": "function", + "function": Value::Object(func) + })) + } + UniversalToolType::Builtin { builtin_type, .. } => { + Err(ConvertError::UnsupportedToolType { + tool_name: self.name.clone(), + tool_type: builtin_type.clone(), + target_provider: "OpenAI Chat Completions".to_string(), + }) + } + } + } + + /// Convert to OpenAI Responses API format (JSON Value). + /// + /// Returns an error if the tool is a builtin from a different provider. 
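And a sketch of the failure mode these conversion methods document (wrapper function illustrative only): a builtin tied to one provider passes through to that provider but refuses to convert to any other, which is also what the batch helpers below propagate.

```rust
use crate::serde_json::json;
use crate::universal::tools::UniversalTool;

// Illustrative wrapper; not part of the patch.
fn builtin_mismatch_sketch() {
    let bash = UniversalTool::builtin(
        "bash",
        "anthropic",
        "bash_20250124",
        Some(json!({ "type": "bash_20250124", "name": "bash" })),
    );

    // Anthropic builtins pass their original config through unchanged...
    assert!(bash.to_anthropic_value().is_ok());
    // ...but cannot be expressed as OpenAI tools, so conversion errors out.
    assert!(bash.to_openai_chat_value().is_err());
    assert!(bash.to_responses_value().is_err());
}
```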
+    pub fn to_responses_value(&self) -> Result<Value, ConvertError> {
+        match &self.tool_type {
+            UniversalToolType::Function => {
+                let mut obj = Map::new();
+                obj.insert("type".into(), Value::String("function".to_string()));
+                obj.insert("name".into(), Value::String(self.name.clone()));
+
+                if let Some(desc) = &self.description {
+                    obj.insert("description".into(), Value::String(desc.clone()));
+                }
+
+                obj.insert(
+                    "parameters".into(),
+                    self.parameters.clone().unwrap_or_else(|| json!({})),
+                );
+
+                // Responses API function tools have strict: false by default
+                obj.insert("strict".into(), Value::Bool(false));
+
+                Ok(Value::Object(obj))
+            }
+            UniversalToolType::Builtin {
+                provider,
+                builtin_type,
+                config,
+            } => {
+                if provider != "openai_responses" {
+                    return Err(ConvertError::UnsupportedToolType {
+                        tool_name: self.name.clone(),
+                        tool_type: builtin_type.clone(),
+                        target_provider: "OpenAI Responses API".to_string(),
+                    });
+                }
+                // Return the original config for Responses API builtins
+                config
+                    .clone()
+                    .ok_or_else(|| ConvertError::MissingRequiredField {
+                        field: format!("config for Responses API builtin tool '{}'", self.name),
+                    })
+            }
+        }
+    }
+}
+
+// =============================================================================
+// Batch Conversion Utilities
+// =============================================================================
+
+/// Convert a slice of UniversalTools to Anthropic format Value array.
+///
+/// Returns an error if any tool cannot be converted (e.g., non-Anthropic builtins).
+pub fn tools_to_anthropic_value(tools: &[UniversalTool]) -> Result<Option<Value>, ConvertError> {
+    if tools.is_empty() {
+        return Ok(None);
+    }
+    let converted: Vec<Value> = tools
+        .iter()
+        .map(|t| t.to_anthropic_value())
+        .collect::<Result<Vec<_>, _>>()?;
+    Ok(Some(Value::Array(converted)))
+}
+
+/// Convert a slice of UniversalTools to OpenAI Chat format Value array.
+///
+/// Returns an error if any tool cannot be converted (e.g., builtins).
+pub fn tools_to_openai_chat_value(tools: &[UniversalTool]) -> Result<Option<Value>, ConvertError> {
+    if tools.is_empty() {
+        return Ok(None);
+    }
+    let converted: Vec<Value> = tools
+        .iter()
+        .map(|t| t.to_openai_chat_value())
+        .collect::<Result<Vec<_>, _>>()?;
+    Ok(Some(Value::Array(converted)))
+}
+
+/// Convert a slice of UniversalTools to Responses API format Value array.
+///
+/// Returns an error if any tool cannot be converted (e.g., Anthropic builtins).
+pub fn tools_to_responses_value(tools: &[UniversalTool]) -> Result<Option<Value>, ConvertError> {
+    if tools.is_empty() {
+        return Ok(None);
+    }
+    let converted: Vec<Value> = tools
+        .iter()
+        .map(|t| t.to_responses_value())
+        .collect::<Result<Vec<_>, _>>()?;
+    Ok(Some(Value::Array(converted)))
+}
+
+// =============================================================================
+// Format Detection
+// =============================================================================
+
+/// Detected tools format for cross-provider translation.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum ToolsFormat {
+    /// OpenAI Chat Completions format: `{type: "function", function: {name, description, parameters}}`
+    OpenAIChat,
+    /// OpenAI Responses API format: `{type: "function", name, description, parameters}` (no wrapper)
+    OpenAIResponses,
+    /// Anthropic custom tool format: `{name, description, input_schema}` (no type field)
+    AnthropicCustom,
+    /// Anthropic built-in tool format: `{type: "bash_20250124", name: "bash"}` etc.
+    AnthropicBuiltin,
+    /// Unknown or unrecognized format
+    Unknown,
+}
+
+/// Detect the format of a tools array.
+///
+/// # Detection logic
+///
+/// 1.
If first tool has `type` field and `function` wrapper → OpenAIChat +/// 2. If first tool has `type` field, no `function`, and type is builtin → AnthropicBuiltin +/// 3. If first tool has `type` field, no `function`, not builtin → OpenAIResponses +/// 4. If first tool has `name` but no `type` → AnthropicCustom +/// 5. Otherwise → Unknown +fn detect_tools_format(tools: &Value) -> ToolsFormat { + let Some(arr) = tools.as_array() else { + return ToolsFormat::Unknown; + }; + let Some(first) = arr.first() else { + return ToolsFormat::Unknown; + }; + + let has_type = first.get("type").and_then(Value::as_str); + let has_function_wrapper = first.get("function").is_some(); + let has_name = first.get("name").is_some(); + + match (has_type, has_function_wrapper, has_name) { + // Has type and function wrapper → OpenAI Chat format + (Some("function"), true, _) => ToolsFormat::OpenAIChat, + + // Has type, no function wrapper → check if Anthropic builtin or Responses API + (Some(t), false, _) => { + // Anthropic built-in tools use versioned type names (e.g., bash_20250124). + // Update this list when Anthropic adds new built-in tool types. + if t.starts_with("bash_") + || t.starts_with("text_editor_") + || t.starts_with("web_search_") + { + ToolsFormat::AnthropicBuiltin + } else { + ToolsFormat::OpenAIResponses + } + } + + // Has name but no type → Anthropic custom format + (None, _, true) => ToolsFormat::AnthropicCustom, + + // Anything else + _ => ToolsFormat::Unknown, + } +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_universal_tool_function_constructor() { + let tool = UniversalTool::function( + "get_weather", + Some("Get the weather".to_string()), + Some(json!({"type": "object"})), + ); + + assert_eq!(tool.name, "get_weather"); + assert_eq!(tool.description, Some("Get the weather".to_string())); + assert!(tool.is_function()); + assert!(!tool.is_builtin()); + assert!(tool.builtin_provider().is_none()); + } + + #[test] + fn test_universal_tool_builtin_constructor() { + let tool = UniversalTool::builtin( + "bash", + "anthropic", + "bash_20250124", + Some(json!({"name": "bash"})), + ); + + assert_eq!(tool.name, "bash"); + assert!(!tool.is_function()); + assert!(tool.is_builtin()); + assert_eq!(tool.builtin_provider(), Some("anthropic")); + } + + #[test] + fn test_universal_tool_from_anthropic_custom() { + let anthropic = json!({ + "name": "get_weather", + "description": "Get weather info", + "input_schema": {"type": "object", "properties": {"location": {"type": "string"}}} + }); + + let tool = UniversalTool::from_anthropic_value(&anthropic).unwrap(); + + assert_eq!(tool.name, "get_weather"); + assert_eq!(tool.description, Some("Get weather info".to_string())); + assert!(tool.is_function()); + assert!(tool.parameters.is_some()); + } + + #[test] + fn test_universal_tool_from_anthropic_builtin() { + let anthropic = json!({ + "type": "bash_20250124", + "name": "bash" + }); + + let tool = UniversalTool::from_anthropic_value(&anthropic).unwrap(); + + assert_eq!(tool.name, "bash"); + assert!(tool.is_builtin()); + assert_eq!(tool.builtin_provider(), Some("anthropic")); + + if let UniversalToolType::Builtin { builtin_type, .. 
} = &tool.tool_type { + assert_eq!(builtin_type, "bash_20250124"); + } else { + panic!("Expected Builtin type"); + } + } + + #[test] + fn test_universal_tool_from_openai_chat() { + let openai = json!({ + "type": "function", + "function": { + "name": "get_weather", + "description": "Get weather", + "parameters": {"type": "object"} + } + }); + + let tool = UniversalTool::from_openai_chat_value(&openai).unwrap(); + + assert_eq!(tool.name, "get_weather"); + assert_eq!(tool.description, Some("Get weather".to_string())); + assert!(tool.is_function()); + } + + #[test] + fn test_universal_tool_from_responses_function() { + let responses = json!({ + "type": "function", + "name": "get_weather", + "description": "Get weather", + "parameters": {"type": "object"}, + "strict": false + }); + + let tool = UniversalTool::from_responses_value(&responses).unwrap(); + + assert_eq!(tool.name, "get_weather"); + assert!(tool.is_function()); + } + + #[test] + fn test_universal_tool_from_responses_builtin() { + let responses = json!({ + "type": "code_interpreter" + }); + + let tool = UniversalTool::from_responses_value(&responses).unwrap(); + + assert_eq!(tool.name, "code_interpreter"); + assert!(tool.is_builtin()); + assert_eq!(tool.builtin_provider(), Some("openai_responses")); + } + + #[test] + fn test_universal_tool_to_anthropic_function() { + let tool = UniversalTool::function( + "get_weather", + Some("Get weather".to_string()), + Some(json!({"type": "object"})), + ); + + let value = tool.to_anthropic_value().unwrap(); + + assert_eq!(value["name"], "get_weather"); + assert_eq!(value["description"], "Get weather"); + assert!(value["input_schema"].is_object()); + assert!(value.get("type").is_none()); // Custom tools don't have type field + } + + #[test] + fn test_universal_tool_to_anthropic_builtin_passthrough() { + let config = json!({ + "type": "bash_20250124", + "name": "bash" + }); + let tool = + UniversalTool::builtin("bash", "anthropic", "bash_20250124", Some(config.clone())); + + let value = tool.to_anthropic_value().unwrap(); + assert_eq!(value, config); + } + + #[test] + fn test_universal_tool_to_anthropic_builtin_wrong_provider() { + let tool = UniversalTool::builtin( + "code_interpreter", + "openai_responses", + "code_interpreter", + Some(json!({})), + ); + + let result = tool.to_anthropic_value(); + assert!(result.is_err()); + } + + #[test] + fn test_universal_tool_to_openai_chat_function() { + let tool = UniversalTool::function( + "get_weather", + Some("Get weather".to_string()), + Some(json!({"type": "object"})), + ); + + let value = tool.to_openai_chat_value().unwrap(); + + assert_eq!(value["type"], "function"); + assert_eq!(value["function"]["name"], "get_weather"); + assert_eq!(value["function"]["description"], "Get weather"); + } + + #[test] + fn test_universal_tool_to_openai_chat_builtin_error() { + let tool = UniversalTool::builtin("bash", "anthropic", "bash_20250124", Some(json!({}))); + + let result = tool.to_openai_chat_value(); + assert!(result.is_err()); + } + + #[test] + fn test_universal_tool_to_responses_function() { + let tool = UniversalTool::function( + "get_weather", + Some("Get weather".to_string()), + Some(json!({"type": "object"})), + ); + + let value = tool.to_responses_value().unwrap(); + + assert_eq!(value["type"], "function"); + assert_eq!(value["name"], "get_weather"); + assert_eq!(value["description"], "Get weather"); + assert_eq!(value["strict"], false); + } + + #[test] + fn test_universal_tool_to_responses_builtin_passthrough() { + let config = json!({"type": 
"code_interpreter"}); + let tool = UniversalTool::builtin( + "code_interpreter", + "openai_responses", + "code_interpreter", + Some(config.clone()), + ); + + let value = tool.to_responses_value().unwrap(); + assert_eq!(value, config); + } + + #[test] + fn test_universal_tool_roundtrip_anthropic() { + let original = json!({ + "name": "get_weather", + "description": "Get weather info", + "input_schema": {"type": "object", "properties": {"location": {"type": "string"}}} + }); + + let tool = UniversalTool::from_anthropic_value(&original).unwrap(); + let back = tool.to_anthropic_value().unwrap(); + + assert_eq!(back["name"], original["name"]); + assert_eq!(back["description"], original["description"]); + // Note: input_schema may have empty object default if original was missing + } + + #[test] + fn test_universal_tool_roundtrip_openai_chat() { + let original = json!({ + "type": "function", + "function": { + "name": "get_weather", + "description": "Get weather", + "parameters": {"type": "object"} + } + }); + + let tool = UniversalTool::from_openai_chat_value(&original).unwrap(); + let back = tool.to_openai_chat_value().unwrap(); + + assert_eq!(back["type"], "function"); + assert_eq!(back["function"]["name"], original["function"]["name"]); + assert_eq!( + back["function"]["description"], + original["function"]["description"] + ); + } + + #[test] + fn test_universal_tool_cross_provider_anthropic_to_openai() { + let anthropic = json!({ + "name": "get_weather", + "description": "Get weather", + "input_schema": {"type": "object"} + }); + + let tool = UniversalTool::from_anthropic_value(&anthropic).unwrap(); + let openai = tool.to_openai_chat_value().unwrap(); + + assert_eq!(openai["type"], "function"); + assert_eq!(openai["function"]["name"], "get_weather"); + assert_eq!(openai["function"]["description"], "Get weather"); + } + + #[test] + fn test_universal_tool_cross_provider_openai_to_anthropic() { + let openai = json!({ + "type": "function", + "function": { + "name": "get_weather", + "description": "Get weather", + "parameters": {"type": "object"} + } + }); + + let tool = UniversalTool::from_openai_chat_value(&openai).unwrap(); + let anthropic = tool.to_anthropic_value().unwrap(); + + assert_eq!(anthropic["name"], "get_weather"); + assert_eq!(anthropic["description"], "Get weather"); + assert!(anthropic.get("type").is_none()); + } + + #[test] + fn test_batch_conversion_to_anthropic() { + let tools = vec![ + UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::function("tool2", Some("desc2".to_string()), None), + ]; + + let result = tools_to_anthropic_value(&tools).unwrap(); + let arr = result.unwrap().as_array().cloned().unwrap(); + + assert_eq!(arr.len(), 2); + assert_eq!(arr[0]["name"], "tool1"); + assert_eq!(arr[1]["name"], "tool2"); + } + + #[test] + fn test_batch_conversion_to_anthropic_fails_on_wrong_provider() { + let tools = vec![ + UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::builtin( + "code_interpreter", + "openai_responses", + "code_interpreter", + Some(json!({})), + ), + ]; + + let result = tools_to_anthropic_value(&tools); + assert!(result.is_err()); + } + + #[test] + fn test_batch_conversion_to_openai_chat() { + let tools = vec![ + UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::function("tool2", Some("desc2".to_string()), None), + ]; + + let result = tools_to_openai_chat_value(&tools).unwrap(); + let arr = result.unwrap().as_array().cloned().unwrap(); + + assert_eq!(arr.len(), 
2); + assert_eq!(arr[0]["function"]["name"], "tool1"); + } + + #[test] + fn test_batch_conversion_to_openai_chat_fails_on_builtin() { + let tools = vec![ + UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::builtin("bash", "anthropic", "bash_20250124", Some(json!({}))), + ]; + + let result = tools_to_openai_chat_value(&tools); + assert!(result.is_err()); + } + + #[test] + fn test_from_value_array_auto_detect() { + // OpenAI Chat format + let openai = json!([{ + "type": "function", + "function": {"name": "test1", "description": "desc1", "parameters": {}} + }]); + let tools = UniversalTool::from_value_array(&openai); + assert_eq!(tools.len(), 1); + assert_eq!(tools[0].name, "test1"); + + // Anthropic format + let anthropic = json!([{ + "name": "test2", + "description": "desc2", + "input_schema": {} + }]); + let tools = UniversalTool::from_value_array(&anthropic); + assert_eq!(tools.len(), 1); + assert_eq!(tools[0].name, "test2"); + + // Responses API format + let responses = json!([{ + "type": "function", + "name": "test3", + "description": "desc3", + "parameters": {} + }]); + let tools = UniversalTool::from_value_array(&responses); + assert_eq!(tools.len(), 1); + assert_eq!(tools[0].name, "test3"); + } +} diff --git a/crates/lingua/src/wasm.rs b/crates/lingua/src/wasm.rs index c1c9f4e0..9caa1a1d 100644 --- a/crates/lingua/src/wasm.rs +++ b/crates/lingua/src/wasm.rs @@ -5,6 +5,7 @@ use wasm_bindgen::prelude::*; // Import our types and conversion traits use crate::providers::anthropic::generated as anthropic; use crate::providers::openai::generated as openai; +use crate::providers::openai::ChatCompletionRequestMessageExt; use crate::universal::{convert::TryFromLLM, Message}; fn convert_to_lingua(value: JsValue) -> Result @@ -53,13 +54,13 @@ where /// Convert array of Chat Completions messages to Lingua Messages #[wasm_bindgen] pub fn chat_completions_messages_to_lingua(value: JsValue) -> Result { - convert_to_lingua::, Vec>(value) + convert_to_lingua::, Vec>(value) } /// Convert array of Lingua Messages to Chat Completions messages #[wasm_bindgen] pub fn lingua_to_chat_completions_messages(value: JsValue) -> Result { - convert_from_lingua::, Vec>(value) + convert_from_lingua::, Vec>(value) } /// Convert array of Responses API messages to Lingua Messages diff --git a/payloads/scripts/providers/openai.ts b/payloads/scripts/providers/openai.ts index da3ea416..3bca2253 100644 --- a/payloads/scripts/providers/openai.ts +++ b/payloads/scripts/providers/openai.ts @@ -215,6 +215,8 @@ export const openaiExecutor: ProviderExecutor< "service_tier", "system_fingerprint", "choices.*.message.content", + "choices.*.message.reasoning", // Extended thinking content varies per request + "choices.*.message.reasoning_signature", // Cryptographic signature for reasoning roundtrips "choices.*.message.tool_calls.*.id", "choices.*.delta.content", "choices.*.delta.tool_calls.*.id", diff --git a/payloads/scripts/validate.ts b/payloads/scripts/validate.ts index b237ca16..f0763c04 100644 --- a/payloads/scripts/validate.ts +++ b/payloads/scripts/validate.ts @@ -172,6 +172,7 @@ async function main(): Promise { providers: options.providers, all: options.all, stream: options.stream, + verbose: options.verbose, onResult: (result) => { results.push(result); printer.printResult(result); diff --git a/payloads/scripts/validation/index.ts b/payloads/scripts/validation/index.ts index ff2e7e59..a4755aa5 100644 --- a/payloads/scripts/validation/index.ts +++ b/payloads/scripts/validation/index.ts @@ 
-18,7 +18,7 @@ import { } from "../../cases"; import { OPENAI_CHAT_COMPLETIONS_MODEL, - ANTHROPIC_MODEL, + ANTHROPIC_STRUCTURED_OUTPUT_MODEL, GOOGLE_MODEL, BEDROCK_MODEL, } from "../../cases/models"; @@ -50,6 +50,42 @@ const formatRegistry: Record = { }; /* eslint-enable @typescript-eslint/consistent-type-assertions */ +/** + * Type guard to check if value is a record with string keys. + */ +function isRecord(value: unknown): value is Record { + return typeof value === "object" && value !== null && !Array.isArray(value); +} + +/** + * Extract model name from actual API response. + * Handles both streaming (array) and non-streaming (object) responses. + */ +function extractModelFromResponse( + response: unknown, + isStreaming?: boolean +): string | undefined { + if (!response) return undefined; + + if (isStreaming && Array.isArray(response)) { + // Streaming: model is in response[0].response.model + const firstChunk: unknown = response[0]; + if (isRecord(firstChunk) && isRecord(firstChunk.response)) { + const nested = firstChunk.response; + if (typeof nested.model === "string") { + return nested.model; + } + } + } else if (isRecord(response)) { + // Non-streaming: model is directly on response.model + if (typeof response.model === "string") { + return response.model; + } + } + + return undefined; +} + export interface ValidationOptions { proxyUrl: string; apiKey?: string; // API key to use (e.g., BRAINTRUST_API_KEY) @@ -58,6 +94,7 @@ export interface ValidationOptions { providers?: string[]; // provider aliases to test (default: uses snapshot model) all?: boolean; // run all cases including slow ones stream?: boolean; // default: false (non-streaming only) + verbose?: boolean; // include actual response in results onResult?: (result: ValidationResult) => void; // callback for streaming results } @@ -70,6 +107,7 @@ export interface ValidationResult { durationMs: number; diff?: DiffResult; // only if success=false due to diff, or warning=true error?: string; // only if request failed + actualResponse?: unknown; // the actual response from the proxy (when verbose) } /** @@ -102,7 +140,7 @@ const DEFAULT_CASES = ["simpleRequest", "toolCallRequest", "reasoningRequest"]; // Provider registry - maps provider aliases to actual model names (uses canonical models.ts) const PROVIDER_REGISTRY: Record = { openai: OPENAI_CHAT_COMPLETIONS_MODEL, - anthropic: ANTHROPIC_MODEL, + anthropic: ANTHROPIC_STRUCTURED_OUTPUT_MODEL, google: GOOGLE_MODEL, bedrock: BEDROCK_MODEL, }; @@ -262,17 +300,17 @@ export async function runValidation( return result; } - // Override model if not using default - // Only override if test uses the default chat-completions model - // Preserve explicit model choices (e.g., reasoning models like gpt-5-nano) + // Override model only for cross-provider testing + // OpenAI formats (chat-completions, responses) with non-OpenAI providers if ( providerAlias !== "default" && + providerAlias !== "openai" && // Don't override for OpenAI - tests have correct models PROVIDER_REGISTRY[providerAlias] ) { - if ( - request.model === OPENAI_CHAT_COMPLETIONS_MODEL || - !request.model - ) { + const isOpenAIFormat = + format === "chat-completions" || format === "responses"; + if (isOpenAIFormat) { + // Override for cross-provider translation testing request = { ...request, model: PROVIDER_REGISTRY[providerAlias], @@ -304,6 +342,12 @@ export async function runValidation( const actualResponse = options.stream ? 
actual.streamingResponse : actual.response; + + // Extract actual model from response (fallback to registry-based name) + const actualModel = + extractModelFromResponse(actualResponse, options.stream) ?? + modelName; + const diff = compareResponses( expectedResponse, actualResponse, @@ -318,11 +362,12 @@ export async function runValidation( const result: ValidationResult = { format, caseName, - model: modelName, + model: actualModel, success: diff.match || onlyMinorDiffs, warning: onlyMinorDiffs ? true : undefined, durationMs: Date.now() - start, diff: diff.match ? undefined : diff, // Include diff for warnings too + actualResponse: options.verbose ? actualResponse : undefined, }; options.onResult?.(result); return result; diff --git a/payloads/scripts/validation/reporter.ts b/payloads/scripts/validation/reporter.ts index 3d5b6a72..b25f8791 100644 --- a/payloads/scripts/validation/reporter.ts +++ b/payloads/scripts/validation/reporter.ts @@ -58,8 +58,8 @@ export function createStreamingPrinter(options: PrinterOptions) { const duration = `${colors.dim}(${result.durationMs}ms)${colors.reset}`; const modelLabel = result.model !== "default" - ? ` ${colors.cyan}[${result.model}]${colors.reset}` - : ""; + ? ` ${colors.cyan}[${result.format} - ${result.model}]${colors.reset}` + : ` ${colors.cyan}[${result.format}]${colors.reset}`; if (result.success && !result.warning) { // Clean pass - no diffs @@ -103,6 +103,17 @@ export function createStreamingPrinter(options: PrinterOptions) { ); } } + + // Print actual response when verbose mode is on + if (verbose && result.actualResponse !== undefined) { + console.log(` ${colors.cyan}Actual response:${colors.reset}`); + console.log( + JSON.stringify(result.actualResponse, null, 2) + .split("\n") + .map((line) => ` ${colors.dim}${line}${colors.reset}`) + .join("\n") + ); + } }, printSummary(results: ValidationResult[]): void { From 80528b17ca59208718ccc8104436a30fc90fee21 Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Sun, 25 Jan 2026 20:12:02 -0500 Subject: [PATCH 2/5] address PR comments --- .../cross-transformation-coverage.yml | 12 +- .../src/requests_expected_differences.json | 25 ++-- .../tests/cross_provider_test.rs | 3 +- crates/lingua/docs/ADDING_PROVIDER_FORMAT.md | 5 +- crates/lingua/src/processing/adapters.rs | 34 ----- .../lingua/src/providers/anthropic/adapter.rs | 65 +++------ .../lingua/src/providers/anthropic/convert.rs | 126 ++++++++++++++++++ .../lingua/src/providers/bedrock/adapter.rs | 31 ++--- crates/lingua/src/providers/google/adapter.rs | 54 ++++---- crates/lingua/src/providers/openai/adapter.rs | 92 ++++++------- .../src/providers/openai/responses_adapter.rs | 61 ++++----- crates/lingua/src/universal/reasoning.rs | 114 +++++++++++++++- crates/lingua/src/universal/request.rs | 115 ++++++++++------ crates/lingua/src/universal/response.rs | 52 ++++---- crates/lingua/src/universal/tools.rs | 66 +++++++-- 15 files changed, 532 insertions(+), 323 deletions(-) diff --git a/.github/workflows/cross-transformation-coverage.yml b/.github/workflows/cross-transformation-coverage.yml index 0acb96ac..5c24219a 100644 --- a/.github/workflows/cross-transformation-coverage.yml +++ b/.github/workflows/cross-transformation-coverage.yml @@ -42,25 +42,23 @@ jobs: sudo apt-get update sudo apt-get install -y protobuf-compiler + - name: Verify no unexpected failures + run: | + cargo test -p coverage-report --test cross_provider_test -- --nocapture + - name: Generate coverage report run: | cargo run -p coverage-report > coverage_report.md - name: Post 
coverage to job summary - if: always() run: | echo "# 🔄 Cross-Provider Transformation Coverage" >> $GITHUB_STEP_SUMMARY echo "" >> $GITHUB_STEP_SUMMARY cat coverage_report.md >> $GITHUB_STEP_SUMMARY - name: Upload coverage artifact - if: always() uses: actions/upload-artifact@v4 with: name: transformation-coverage-report path: coverage_report.md - retention-days: 30 - - - name: Verify no unexpected failures - run: | - cargo test -p coverage-report --test cross_provider_test -- --nocapture + retention-days: 30 \ No newline at end of file diff --git a/crates/coverage-report/src/requests_expected_differences.json b/crates/coverage-report/src/requests_expected_differences.json index 9e9d1f2f..2879210b 100644 --- a/crates/coverage-report/src/requests_expected_differences.json +++ b/crates/coverage-report/src/requests_expected_differences.json @@ -20,26 +20,23 @@ { "pattern": "params.response_format", "reason": "Anthropic doesn't support Text format type" }, { "pattern": "params.metadata", "reason": "Anthropic only accepts user_id in metadata" }, { "pattern": "params.parallel_tool_calls", "reason": "Anthropic only supports disable_parallel via tool_choice" }, - { "pattern": "params.tool_choice", "reason": "Anthropic requires tool_choice to express disable_parallel_tool_use" } - ], - "errors": [ - { "pattern": "does not support logprobs", "reason": "Anthropic doesn't support logprobs parameter" }, - { "pattern": "does not support top_logprobs", "reason": "Anthropic doesn't support top_logprobs parameter" }, - { "pattern": "does not support frequency_penalty", "reason": "Anthropic doesn't support frequency_penalty parameter" }, - { "pattern": "does not support presence_penalty", "reason": "Anthropic doesn't support presence_penalty parameter" }, - { "pattern": "does not support seed", "reason": "Anthropic doesn't support seed parameter" }, - { "pattern": "does not support store", "reason": "Anthropic doesn't support store parameter" }, - { "pattern": "does not support n > 1", "reason": "Anthropic doesn't support multiple completions" } + { "pattern": "params.tool_choice", "reason": "Anthropic requires tool_choice to express disable_parallel_tool_use" }, + { "pattern": "params.logprobs", "reason": "Anthropic doesn't support logprobs (silently dropped)" }, + { "pattern": "params.top_logprobs", "reason": "Anthropic doesn't support top_logprobs (silently dropped)" }, + { "pattern": "params.frequency_penalty", "reason": "Anthropic doesn't support frequency_penalty (silently dropped)" }, + { "pattern": "params.presence_penalty", "reason": "Anthropic doesn't support presence_penalty (silently dropped)" }, + { "pattern": "params.seed", "reason": "Anthropic doesn't support seed (silently dropped)" }, + { "pattern": "params.store", "reason": "Anthropic doesn't support store (silently dropped)" } ] }, { "source": "*", "target": "ChatCompletions", "fields": [ - { "pattern": "params.reasoning.summary", "reason": "ChatCompletions doesn't support reasoning summary" } + { "pattern": "params.reasoning.summary", "reason": "ChatCompletions doesn't support reasoning summary" }, + { "pattern": "params.top_k", "reason": "ChatCompletions doesn't support top_k (silently dropped)" } ], "errors": [ - { "pattern": "does not support top_k", "reason": "OpenAI Chat Completions doesn't support top_k parameter" }, { "pattern": "is not supported by OpenAI Chat Completions", "reason": "Provider-specific built-in tool has no OpenAI equivalent" }, { "pattern": "Unsupported input type: UserContentPart variant: File", "reason": 
"Anthropic document blocks not supported in OpenAI" } ] @@ -56,10 +53,10 @@ "source": "*", "target": "Responses", "fields": [ + { "pattern": "params.top_k", "reason": "Responses API doesn't support top_k (silently dropped)" }, + { "pattern": "params.stop", "reason": "Responses API doesn't support stop sequences (silently dropped)" } ], "errors": [ - { "pattern": "does not support top_k", "reason": "OpenAI Responses API doesn't support top_k parameter" }, - { "pattern": "does not support stop sequences", "reason": "OpenAI Responses API doesn't support stop sequences" }, { "pattern": "is not supported by OpenAI Responses API", "reason": "Provider-specific built-in tool has no OpenAI equivalent" }, { "pattern": "Unsupported input type: UserContentPart variant: File", "reason": "Anthropic document blocks not supported in OpenAI" }, { "pattern": "ToolResult { tool_name: \"web_search\"", "reason": "Anthropic web_search encrypted results cannot be transformed to OpenAI" } diff --git a/crates/coverage-report/tests/cross_provider_test.rs b/crates/coverage-report/tests/cross_provider_test.rs index 31f5d5e7..168203d3 100644 --- a/crates/coverage-report/tests/cross_provider_test.rs +++ b/crates/coverage-report/tests/cross_provider_test.rs @@ -11,7 +11,8 @@ use coverage_report::types::TestFilter; use lingua::capabilities::ProviderFormat; use lingua::processing::adapters::adapters; -/// Required providers for CI: Anthropic <-> ChatCompletions <-> Responses +/// TODO: remove REQUIRED_PROVIDERS once all formats are fully supported by coverage-report. +/// this is temporary as we make incremental progress. const REQUIRED_PROVIDERS: &[ProviderFormat] = &[ ProviderFormat::Responses, ProviderFormat::OpenAI, // ChatCompletions diff --git a/crates/lingua/docs/ADDING_PROVIDER_FORMAT.md b/crates/lingua/docs/ADDING_PROVIDER_FORMAT.md index 5539a27f..dda56933 100644 --- a/crates/lingua/docs/ADDING_PROVIDER_FORMAT.md +++ b/crates/lingua/docs/ADDING_PROVIDER_FORMAT.md @@ -707,7 +707,10 @@ impl TryFromLLM for Message { "system" => Ok(Message::System { content: UserContent::String(msg.content), }), - other => Err(ConvertError::InvalidRole { role: other.to_string() }), + other => Err(ConvertError::InvalidEnumValue { + type_name: "role", + value: other, + }), } } } diff --git a/crates/lingua/src/processing/adapters.rs b/crates/lingua/src/processing/adapters.rs index f7bf1eb7..fc027136 100644 --- a/crates/lingua/src/processing/adapters.rs +++ b/crates/lingua/src/processing/adapters.rs @@ -12,40 +12,6 @@ provider-specific logic into a single interface. 3. Register it in `adapters()` with the appropriate feature gate */ -/// Macro to reject unsupported parameters in provider adapters. -/// -/// This macro reduces boilerplate when validating that a UniversalRequest doesn't -/// contain parameters that a provider doesn't support. -/// -/// # Example -/// -/// ```ignore -/// reject_params!(req, ProviderFormat::Anthropic, -/// logprobs, -/// top_logprobs, -/// presence_penalty, -/// frequency_penalty, -/// seed, -/// store -/// ); -/// ``` -/// -/// This expands to individual checks for each field, returning a ValidationFailed -/// error if any unsupported field is present. -#[macro_export] -macro_rules! reject_params { - ($req:expr, $target:expr, $($field:ident),+ $(,)?) 
=> { - $( - if $req.params.$field.is_some() { - return Err($crate::processing::transform::TransformError::ValidationFailed { - target: $target, - reason: concat!("does not support ", stringify!($field)).to_string(), - }); - } - )+ - }; -} - use std::sync::LazyLock; use crate::capabilities::ProviderFormat; diff --git a/crates/lingua/src/providers/anthropic/adapter.rs b/crates/lingua/src/providers/anthropic/adapter.rs index 32aa66b8..bde7ec79 100644 --- a/crates/lingua/src/providers/anthropic/adapter.rs +++ b/crates/lingua/src/providers/anthropic/adapter.rs @@ -15,7 +15,6 @@ use crate::processing::transform::TransformError; use crate::providers::anthropic::generated::{ContentBlock, InputMessage}; use crate::providers::anthropic::params::AnthropicParams; use crate::providers::anthropic::try_parse_anthropic; -use crate::reject_params; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::{Message, UserContent}; @@ -26,7 +25,6 @@ use crate::universal::{ parse_stop_sequences, FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, PLACEHOLDER_ID, PLACEHOLDER_MODEL, }; -use std::collections::HashMap; use std::convert::TryInto; /// Default max_tokens for Anthropic requests (matches legacy proxy behavior). @@ -65,7 +63,7 @@ impl ProviderAdapter for AnthropicAdapter { let messages = as TryFromLLM>>::try_from(input_messages) .map_err(|e| TransformError::ToUniversalFailed(e.to_string()))?; - let params = UniversalParams { + let mut params = UniversalParams { temperature: typed_params.temperature, top_p: typed_params.top_p, top_k: typed_params.top_k, @@ -106,12 +104,12 @@ impl ProviderAdapter for AnthropicAdapter { service_tier: typed_params.service_tier, logprobs: None, // Anthropic doesn't support logprobs top_logprobs: None, // Anthropic doesn't support top_logprobs + extras: Default::default(), }; // Use extras captured automatically via #[serde(flatten)] - let mut provider_extras = HashMap::new(); if !typed_params.extras.is_empty() { - provider_extras.insert( + params.extras.insert( ProviderFormat::Anthropic, typed_params.extras.into_iter().collect(), ); @@ -121,7 +119,6 @@ impl ProviderAdapter for AnthropicAdapter { model: typed_params.model, messages, params, - provider_extras, }) } @@ -131,29 +128,6 @@ impl ProviderAdapter for AnthropicAdapter { reason: "missing model".to_string(), })?; - // Validate unsupported parameters - reject_params!( - req, - ProviderFormat::Anthropic, - logprobs, - top_logprobs, - presence_penalty, - frequency_penalty, - seed, - store - ); - // Anthropic doesn't support multiple completions (n > 1) - if let Some(openai_extras) = req.provider_extras.get(&ProviderFormat::OpenAI) { - if let Some(n) = openai_extras.get("n").and_then(Value::as_i64) { - if n > 1 { - return Err(TransformError::ValidationFailed { - target: ProviderFormat::Anthropic, - reason: "does not support n > 1 (multiple completions)".to_string(), - }); - } - } - } - // Clone messages and extract system messages (Anthropic uses separate `system` param) let mut msgs = req.messages.clone(); let system_contents = extract_system_messages(&mut msgs); @@ -261,7 +235,7 @@ impl ProviderAdapter for AnthropicAdapter { } // Merge back provider-specific extras (only for Anthropic) - if let Some(extras) = req.provider_extras.get(&ProviderFormat::Anthropic) { + if let Some(extras) = req.params.extras.get(&ProviderFormat::Anthropic) { for (k, v) in extras { // Don't overwrite canonical 
fields we already handled if !obj.contains_key(k) { @@ -341,22 +315,25 @@ impl ProviderAdapter for AnthropicAdapter { .map(|r| r.to_provider_string(self.format()).to_string()) .unwrap_or_else(|| "end_turn".to_string()); - let mut obj = serde_json::json!({ - "id": format!("msg_{}", PLACEHOLDER_ID), - "type": "message", - "role": "assistant", - "content": content_value, - "model": resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), - "stop_reason": stop_reason - }); + let mut map = serde_json::Map::new(); + map.insert( + "id".into(), + Value::String(format!("msg_{}", PLACEHOLDER_ID)), + ); + map.insert("type".into(), Value::String("message".into())); + map.insert("role".into(), Value::String("assistant".into())); + map.insert("content".into(), content_value); + map.insert( + "model".into(), + Value::String(resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL).into()), + ); + map.insert("stop_reason".into(), Value::String(stop_reason)); if let Some(usage) = &resp.usage { - obj.as_object_mut() - .unwrap() - .insert("usage".into(), usage.to_provider_value(self.format())); + map.insert("usage".into(), usage.to_provider_value(self.format())); } - Ok(obj) + Ok(Value::Object(map)) } // ========================================================================= @@ -680,7 +657,6 @@ mod tests { model: Some("claude-3-5-sonnet-20241022".to_string()), messages: vec![], params: UniversalParams::default(), - provider_extras: HashMap::new(), }; assert!(req.params.max_tokens.is_none()); @@ -698,7 +674,6 @@ mod tests { max_tokens: Some(8192), ..Default::default() }, - provider_extras: HashMap::new(), }; adapter.apply_defaults(&mut req); @@ -728,7 +703,6 @@ mod tests { max_tokens: Some(4096), ..Default::default() }, - provider_extras: HashMap::new(), }; let result = adapter.request_from_universal(&req).unwrap(); @@ -764,7 +738,6 @@ mod tests { max_tokens: Some(1024), ..Default::default() }, - provider_extras: HashMap::new(), }; let result = adapter.request_from_universal(&req).unwrap(); diff --git a/crates/lingua/src/providers/anthropic/convert.rs b/crates/lingua/src/providers/anthropic/convert.rs index cdca8528..e57b4249 100644 --- a/crates/lingua/src/providers/anthropic/convert.rs +++ b/crates/lingua/src/providers/anthropic/convert.rs @@ -1048,3 +1048,129 @@ impl TryFromLLM> for Vec { Ok(content_blocks) } } + +#[cfg(test)] +mod tests { + use super::*; + use crate::universal::convert::TryFromLLM; + + #[test] + fn test_file_to_anthropic_document_with_provider_options() { + // Create a File content part marked as a document (via provider_options) + let mut opts = serde_json::Map::new(); + opts.insert( + "anthropic_type".into(), + serde_json::Value::String("document".to_string()), + ); + opts.insert( + "title".into(), + serde_json::Value::String("Test Document".to_string()), + ); + + let file_part = UserContentPart::File { + data: serde_json::Value::String("base64encodeddata".to_string()), + filename: Some("test.pdf".to_string()), + media_type: "application/pdf".to_string(), + provider_options: Some(ProviderOptions { options: opts }), + }; + + // Create a user message with the file part + let message = Message::User { + content: UserContent::Array(vec![file_part]), + }; + + // Convert to Anthropic InputMessage + let result: Result = + >::try_from(message); + + assert!(result.is_ok(), "File conversion should succeed"); + let input_msg = result.unwrap(); + + // Verify it's a user message with document block + assert!(matches!(input_msg.role, generated::MessageRole::User)); + if let 
generated::MessageContent::InputContentBlockArray(blocks) = input_msg.content { + assert_eq!(blocks.len(), 1, "Should have exactly one content block"); + let block = &blocks[0]; + assert!( + matches!( + block.input_content_block_type, + generated::InputContentBlockType::Document + ), + "Should be a Document block" + ); + assert_eq!(block.title, Some("Test Document".to_string())); + } else { + panic!("Expected InputContentBlockArray"); + } + } + + #[test] + fn test_regular_file_without_anthropic_marker_is_skipped() { + // Create a regular File content part (no anthropic_type marker) + let file_part = UserContentPart::File { + data: serde_json::Value::String("base64encodeddata".to_string()), + filename: Some("test.pdf".to_string()), + media_type: "application/pdf".to_string(), + provider_options: None, // No anthropic_type marker + }; + + let message = Message::User { + content: UserContent::Array(vec![file_part]), + }; + + let result: Result = + >::try_from(message); + + assert!(result.is_ok()); + let input_msg = result.unwrap(); + + // Regular files without anthropic_type marker are currently skipped + if let generated::MessageContent::InputContentBlockArray(blocks) = input_msg.content { + // The file was skipped, so blocks should be empty + assert!( + blocks.is_empty(), + "Regular files without anthropic_type should be skipped (current behavior)" + ); + } + } + + #[test] + fn test_image_url_to_anthropic() { + let image_part = UserContentPart::Image { + image: serde_json::Value::String("https://example.com/image.jpg".to_string()), + media_type: Some("image/jpeg".to_string()), + provider_options: None, + }; + + let message = Message::User { + content: UserContent::Array(vec![image_part]), + }; + + let result: Result = + >::try_from(message); + + assert!(result.is_ok()); + let input_msg = result.unwrap(); + + if let generated::MessageContent::InputContentBlockArray(blocks) = input_msg.content { + assert_eq!(blocks.len(), 1); + let block = &blocks[0]; + assert!(matches!( + block.input_content_block_type, + generated::InputContentBlockType::Image + )); + // Verify URL source type is used + if let Some(generated::Source::SourceSource(source)) = &block.source { + assert!(matches!(source.source_type, generated::FluffyType::Url)); + assert_eq!( + source.url, + Some("https://example.com/image.jpg".to_string()) + ); + } else { + panic!("Expected SourceSource"); + } + } else { + panic!("Expected InputContentBlockArray"); + } + } +} diff --git a/crates/lingua/src/providers/bedrock/adapter.rs b/crates/lingua/src/providers/bedrock/adapter.rs index 987e8609..6cd214ac 100644 --- a/crates/lingua/src/providers/bedrock/adapter.rs +++ b/crates/lingua/src/providers/bedrock/adapter.rs @@ -26,7 +26,6 @@ use crate::universal::{ FinishReason, UniversalParams, UniversalRequest, UniversalResponse, UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, }; -use std::collections::HashMap; /// Adapter for Amazon Bedrock Converse API. 
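
// A minimal, self-contained sketch of the extras scoping used in the adapter
// hunks above and below: extras captured via #[serde(flatten)] now live in
// `params.extras`, keyed by the source format, and are only merged back when
// converting to that same format. Names here are simplified stand-ins, not
// the actual lingua types.
use std::collections::HashMap;
use serde_json::{json, Map, Value};

#[derive(PartialEq, Eq, Hash, Clone, Copy)]
enum Format {
    Converse,
    OpenAI,
}

fn merge_extras(
    obj: &mut Map<String, Value>,
    extras: &HashMap<Format, Map<String, Value>>,
    target: Format,
) {
    if let Some(map) = extras.get(&target) {
        for (k, v) in map {
            // Don't overwrite canonical fields that were already populated.
            if !obj.contains_key(k) {
                obj.insert(k.clone(), v.clone());
            }
        }
    }
}

fn main() {
    let mut extras = HashMap::new();
    let mut converse_only = Map::new();
    converse_only.insert("additionalModelRequestFields".into(), json!({"top_k": 40}));
    extras.insert(Format::Converse, converse_only);

    let mut openai_obj = Map::new();
    merge_extras(&mut openai_obj, &extras, Format::OpenAI);
    assert!(openai_obj.is_empty()); // no cross-provider contamination

    let mut converse_obj = Map::new();
    merge_extras(&mut converse_obj, &extras, Format::Converse);
    assert!(converse_obj.contains_key("additionalModelRequestFields"));
}
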
pub struct BedrockAdapter; @@ -84,7 +83,7 @@ impl ProviderAdapter for BedrockAdapter { .and_then(|v| serde_json::from_value::(v.clone()).ok()) .map(|t| ReasoningConfig::from(&t)); - let params = UniversalParams { + let mut params = UniversalParams { temperature, top_p, top_k: None, // Bedrock doesn't expose top_k in Converse API @@ -111,6 +110,7 @@ impl ProviderAdapter for BedrockAdapter { name, description, parameters, + None, )); } } @@ -141,12 +141,12 @@ impl ProviderAdapter for BedrockAdapter { service_tier: None, logprobs: None, top_logprobs: None, + extras: Default::default(), }; // Use extras captured automatically via #[serde(flatten)] - let mut provider_extras = HashMap::new(); if !typed_params.extras.is_empty() { - provider_extras.insert( + params.extras.insert( ProviderFormat::Converse, typed_params.extras.into_iter().collect(), ); @@ -156,7 +156,6 @@ impl ProviderAdapter for BedrockAdapter { model: typed_params.model_id, messages, params, - provider_extras, }) } @@ -273,7 +272,7 @@ impl ProviderAdapter for BedrockAdapter { } // Merge back provider-specific extras (only for Bedrock/Converse) - if let Some(extras) = req.provider_extras.get(&ProviderFormat::Converse) { + if let Some(extras) = req.params.extras.get(&ProviderFormat::Converse) { for (k, v) in extras { // Don't overwrite canonical fields we already handled if !obj.contains_key(k) { @@ -347,20 +346,20 @@ impl ProviderAdapter for BedrockAdapter { .map(|r| r.to_provider_string(self.format()).to_string()) .unwrap_or_else(|| "end_turn".to_string()); - let mut obj = serde_json::json!({ - "output": { + let mut map = serde_json::Map::new(); + map.insert( + "output".into(), + serde_json::json!({ "message": message_value - }, - "stopReason": stop_reason - }); + }), + ); + map.insert("stopReason".into(), Value::String(stop_reason)); if let Some(usage) = &resp.usage { - obj.as_object_mut() - .unwrap() - .insert("usage".into(), usage.to_provider_value(self.format())); + map.insert("usage".into(), usage.to_provider_value(self.format())); } - Ok(obj) + Ok(Value::Object(map)) } // ========================================================================= @@ -666,7 +665,6 @@ mod tests { max_tokens: Some(4096), ..Default::default() }, - provider_extras: Default::default(), }; let reconstructed = adapter.request_from_universal(&universal).unwrap(); @@ -698,7 +696,6 @@ mod tests { max_tokens: Some(4096), ..Default::default() }, - provider_extras: Default::default(), }; let reconstructed = adapter.request_from_universal(&universal).unwrap(); diff --git a/crates/lingua/src/providers/google/adapter.rs b/crates/lingua/src/providers/google/adapter.rs index 3d56a650..1a7aee6d 100644 --- a/crates/lingua/src/providers/google/adapter.rs +++ b/crates/lingua/src/providers/google/adapter.rs @@ -26,7 +26,6 @@ use crate::universal::{ UniversalRequest, UniversalResponse, UniversalStreamChoice, UniversalStreamChunk, UniversalUsage, UserContent, }; -use std::collections::HashMap; /// Adapter for Google AI GenerateContent API. 
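
// A small sketch of the response-building change in the hunks above: instead
// of `serde_json::json!({...})` followed by `obj.as_object_mut().unwrap()`,
// the adapters build a `serde_json::Map` directly, so optional fields such as
// usage become plain inserts and the unwrap goes away. Field names follow the
// Bedrock Converse shape used above; values are placeholders.
use serde_json::{json, Map, Value};

fn build_converse_response(stop_reason: &str, usage: Option<Value>) -> Value {
    let mut map = Map::new();
    map.insert("output".into(), json!({ "message": { "role": "assistant" } }));
    map.insert("stopReason".into(), Value::String(stop_reason.into()));
    if let Some(u) = usage {
        // No `as_object_mut().unwrap()` needed for the optional field.
        map.insert("usage".into(), u);
    }
    Value::Object(map)
}

fn main() {
    let v = build_converse_response(
        "end_turn",
        Some(json!({"inputTokens": 10, "outputTokens": 3})),
    );
    assert_eq!(v["stopReason"], "end_turn");
    assert_eq!(v["usage"]["inputTokens"], 10);
}
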
pub struct GoogleAdapter; @@ -93,7 +92,7 @@ impl ProviderAdapter for GoogleAdapter { (None, None, None, None, None, None) }; - let params = UniversalParams { + let mut params = UniversalParams { temperature, top_p, top_k, @@ -121,6 +120,7 @@ impl ProviderAdapter for GoogleAdapter { name, description, parameters, + None, )); } } @@ -153,12 +153,12 @@ impl ProviderAdapter for GoogleAdapter { service_tier: None, logprobs: None, top_logprobs: None, + extras: Default::default(), }; // Use extras captured automatically via #[serde(flatten)] - let mut provider_extras = HashMap::new(); if !typed_params.extras.is_empty() { - provider_extras.insert( + params.extras.insert( ProviderFormat::Google, typed_params.extras.into_iter().collect(), ); @@ -168,7 +168,6 @@ impl ProviderAdapter for GoogleAdapter { model, messages, params, - provider_extras, }) } @@ -324,7 +323,7 @@ impl ProviderAdapter for GoogleAdapter { } // Merge back provider-specific extras (only for Google) - if let Some(extras) = req.provider_extras.get(&ProviderFormat::Google) { + if let Some(extras) = req.params.extras.get(&ProviderFormat::Google) { for (k, v) in extras { // Don't overwrite canonical fields we already handled if !obj.contains_key(k) { @@ -413,18 +412,17 @@ impl ProviderAdapter for GoogleAdapter { }) .collect::, TransformError>>()?; - let mut obj = serde_json::json!({ - "candidates": candidates - }); + let mut map = serde_json::Map::new(); + map.insert("candidates".into(), Value::Array(candidates)); if let Some(usage) = &resp.usage { - obj.as_object_mut().unwrap().insert( + map.insert( "usageMetadata".into(), usage.to_provider_value(self.format()), ); } - Ok(obj) + Ok(Value::Object(map)) } // ========================================================================= @@ -528,45 +526,41 @@ impl ProviderAdapter for GoogleAdapter { other => other, }); - let mut candidate = serde_json::json!({ - "index": c.index, - "content": { + let mut candidate_map = serde_json::Map::new(); + candidate_map.insert("index".into(), serde_json::json!(c.index)); + candidate_map.insert( + "content".into(), + serde_json::json!({ "parts": [{"text": text}], "role": "model" - } - }); + }), + ); if let Some(reason) = finish_reason { - candidate - .as_object_mut() - .unwrap() - .insert("finishReason".into(), Value::String(reason.to_string())); + candidate_map.insert("finishReason".into(), Value::String(reason.to_string())); } - candidate + Value::Object(candidate_map) }) .collect(); - let mut obj = serde_json::json!({ - "candidates": candidates - }); - - let obj_map = obj.as_object_mut().unwrap(); + let mut map = serde_json::Map::new(); + map.insert("candidates".into(), Value::Array(candidates)); if let Some(ref id) = chunk.id { - obj_map.insert("responseId".into(), Value::String(id.clone())); + map.insert("responseId".into(), Value::String(id.clone())); } if let Some(ref model) = chunk.model { - obj_map.insert("modelVersion".into(), Value::String(model.clone())); + map.insert("modelVersion".into(), Value::String(model.clone())); } if let Some(ref usage) = chunk.usage { - obj_map.insert( + map.insert( "usageMetadata".into(), usage.to_provider_value(self.format()), ); } - Ok(obj) + Ok(Value::Object(map)) } } diff --git a/crates/lingua/src/providers/openai/adapter.rs b/crates/lingua/src/providers/openai/adapter.rs index 6eb4164f..528a6a34 100644 --- a/crates/lingua/src/providers/openai/adapter.rs +++ b/crates/lingua/src/providers/openai/adapter.rs @@ -8,8 +8,6 @@ Vertex, and Mistral. 
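
// For reference, the Google streaming chunk assembled by the Google adapter's
// chunk_to_provider hunk above comes out roughly in this shape. Field names
// mirror the construction code (candidates, finishReason, responseId,
// modelVersion, usageMetadata); the concrete values and the usageMetadata keys
// shown here are placeholders, not taken from this patch.
use serde_json::json;

fn main() {
    let chunk = json!({
        "responseId": "resp-123",
        "modelVersion": "gemini-2.0-flash",
        "candidates": [{
            "index": 0,
            "content": { "parts": [{ "text": "Hello" }], "role": "model" },
            "finishReason": "STOP"
        }],
        "usageMetadata": { "promptTokenCount": 5, "candidatesTokenCount": 2 }
    });
    assert_eq!(chunk["candidates"][0]["content"]["role"], "model");
}
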
use crate::capabilities::ProviderFormat; use crate::error::ConvertError; -use crate::reject_params; -use std::collections::HashMap; use crate::processing::adapters::{ insert_opt_bool, insert_opt_f64, insert_opt_i64, insert_opt_value, ProviderAdapter, @@ -127,6 +125,7 @@ impl ProviderAdapter for OpenAIAdapter { service_tier: typed_params.service_tier, logprobs: typed_params.logprobs, top_logprobs: typed_params.top_logprobs, + extras: Default::default(), }; // Sync parallel_tool_calls with tool_choice.disable_parallel for roundtrip fidelity @@ -167,16 +166,14 @@ impl ProviderAdapter for OpenAIAdapter { extras_map.insert("prompt_cache_key".into(), Value::String(prompt_cache_key)); } - let mut provider_extras = HashMap::new(); if !extras_map.is_empty() { - provider_extras.insert(ProviderFormat::OpenAI, extras_map); + params.extras.insert(ProviderFormat::OpenAI, extras_map); } Ok(UniversalRequest { model: typed_params.model, messages, params, - provider_extras, }) } @@ -186,9 +183,6 @@ impl ProviderAdapter for OpenAIAdapter { reason: "missing model".to_string(), })?; - // Validate unsupported parameters - reject_params!(req, ProviderFormat::OpenAI, top_k); - let openai_messages: Vec = as TryFromLLM>>::try_from( req.messages.clone(), @@ -276,7 +270,7 @@ impl ProviderAdapter for OpenAIAdapter { } // Merge back provider-specific extras (only for OpenAI) - if let Some(extras) = req.provider_extras.get(&ProviderFormat::OpenAI) { + if let Some(extras) = req.params.extras.get(&ProviderFormat::OpenAI) { for (k, v) in extras { obj.insert(k.clone(), v.clone()); } @@ -375,21 +369,24 @@ impl ProviderAdapter for OpenAIAdapter { .as_ref() .map(|u| u.to_provider_value(self.format())); - let mut obj = serde_json::json!({ - "id": format!("chatcmpl-{}", PLACEHOLDER_ID), - "object": "chat.completion", - "created": 0, - "model": resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), - "choices": choices - }); + let mut map = serde_json::Map::new(); + map.insert( + "id".into(), + Value::String(format!("chatcmpl-{}", PLACEHOLDER_ID)), + ); + map.insert("object".into(), Value::String("chat.completion".into())); + map.insert("created".into(), serde_json::json!(0)); + map.insert( + "model".into(), + Value::String(resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL).into()), + ); + map.insert("choices".into(), Value::Array(choices)); if let Some(usage_val) = usage { - obj.as_object_mut() - .unwrap() - .insert("usage".into(), usage_val); + map.insert("usage".into(), usage_val); } - Ok(obj) + Ok(Value::Object(map)) } // ========================================================================= @@ -471,48 +468,45 @@ impl ProviderAdapter for OpenAIAdapter { .choices .iter() .map(|c| { - let mut choice = serde_json::json!({ - "index": c.index, - "delta": c.delta.clone().unwrap_or(Value::Object(Map::new())) - }); - if let Some(ref reason) = c.finish_reason { - choice - .as_object_mut() - .unwrap() - .insert("finish_reason".into(), Value::String(reason.clone())); - } else { - choice - .as_object_mut() - .unwrap() - .insert("finish_reason".into(), Value::Null); - } - choice + let mut choice_map = Map::new(); + choice_map.insert("index".into(), serde_json::json!(c.index)); + choice_map.insert( + "delta".into(), + c.delta.clone().unwrap_or(Value::Object(Map::new())), + ); + let finish_reason_val = match &c.finish_reason { + Some(reason) => Value::String(reason.clone()), + None => Value::Null, + }; + choice_map.insert("finish_reason".into(), finish_reason_val); + Value::Object(choice_map) }) .collect(); - let mut obj = 
serde_json::json!({ - "object": "chat.completion.chunk", - "choices": choices - }); + let mut map = Map::new(); + map.insert( + "object".into(), + Value::String("chat.completion.chunk".into()), + ); + map.insert("choices".into(), Value::Array(choices)); - let obj_map = obj.as_object_mut().unwrap(); if let Some(ref id) = chunk.id { - obj_map.insert("id".into(), Value::String(id.clone())); + map.insert("id".into(), Value::String(id.clone())); } if let Some(ref model) = chunk.model { - obj_map.insert("model".into(), Value::String(model.clone())); + map.insert("model".into(), Value::String(model.clone())); } if let Some(created) = chunk.created { - obj_map.insert("created".into(), Value::Number(created.into())); + map.insert("created".into(), Value::Number(created.into())); } if let Some(ref usage) = chunk.usage { - obj_map.insert( + map.insert( "usage".into(), usage.to_provider_value(ProviderFormat::OpenAI), ); } - Ok(obj) + Ok(Value::Object(map)) } } @@ -826,7 +820,8 @@ mod tests { let universal = adapter.request_to_universal(payload).unwrap(); let openai_extras = universal - .provider_extras + .params + .extras .get(&ProviderFormat::OpenAI) .expect("should have OpenAI extras"); assert!(openai_extras.contains_key("user")); @@ -871,7 +866,6 @@ mod tests { }, ], params: Default::default(), - provider_extras: Default::default(), }; // Convert universal to ChatCompletions format @@ -941,7 +935,6 @@ mod tests { }, ], params: Default::default(), - provider_extras: Default::default(), }; // Convert universal to ChatCompletions format @@ -1015,7 +1008,6 @@ mod tests { }, ], params: Default::default(), - provider_extras: Default::default(), }; // Convert universal to ChatCompletions format diff --git a/crates/lingua/src/providers/openai/responses_adapter.rs b/crates/lingua/src/providers/openai/responses_adapter.rs index f6adca93..0b23cdb9 100644 --- a/crates/lingua/src/providers/openai/responses_adapter.rs +++ b/crates/lingua/src/providers/openai/responses_adapter.rs @@ -6,8 +6,6 @@ which is used by reasoning models like o1 and o3. 
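
// Likewise, the Chat Completions streaming chunk built by the chunk_to_provider
// hunk above has roughly this shape: `object`, per-choice `index`/`delta`/
// `finish_reason`, plus optional `id`, `model`, `created`, and `usage`.
// Values below are placeholders.
use serde_json::json;

fn main() {
    let chunk = json!({
        "object": "chat.completion.chunk",
        "id": "chatcmpl-abc123",
        "model": "gpt-4o-mini",
        "created": 0,
        "choices": [{
            "index": 0,
            "delta": { "content": "Hel" },
            "finish_reason": null
        }]
    });
    assert!(chunk["choices"][0]["finish_reason"].is_null());
}
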
*/ use crate::capabilities::ProviderFormat; -use crate::reject_params; -use std::collections::HashMap; use crate::error::ConvertError; use crate::processing::adapters::{ @@ -156,6 +154,7 @@ impl ProviderAdapter for ResponsesAdapter { service_tier: typed_params.service_tier, logprobs: None, // Responses API doesn't support logprobs boolean top_logprobs: typed_params.top_logprobs, + extras: Default::default(), }; // Sync parallel_tool_calls with tool_choice.disable_parallel for roundtrip fidelity @@ -193,16 +192,14 @@ impl ProviderAdapter for ResponsesAdapter { extras_map.insert("prompt_cache_key".into(), Value::String(prompt_cache_key)); } - let mut provider_extras = HashMap::new(); if !extras_map.is_empty() { - provider_extras.insert(ProviderFormat::Responses, extras_map); + params.extras.insert(ProviderFormat::Responses, extras_map); } Ok(UniversalRequest { model: typed_params.model, messages, params, - provider_extras, }) } @@ -212,22 +209,7 @@ impl ProviderAdapter for ResponsesAdapter { reason: "missing model".to_string(), })?; - // Validate unsupported parameters - reject_params!(req, ProviderFormat::Responses, top_k); - // Stop sequences need special handling (check if non-empty) - if req - .params - .stop - .as_ref() - .is_some_and(|stop| !stop.is_empty()) - { - return Err(TransformError::ValidationFailed { - target: ProviderFormat::Responses, - reason: "does not support stop sequences".to_string(), - }); - } - - let responses_extras = req.provider_extras.get(&ProviderFormat::Responses); + let responses_extras = req.params.extras.get(&ProviderFormat::Responses); let mut messages_for_input = req.messages.clone(); if let Some(extras) = responses_extras { if let Some(instructions) = extras.get("instructions").and_then(Value::as_str) { @@ -263,7 +245,7 @@ impl ProviderAdapter for ResponsesAdapter { insert_opt_bool(&mut obj, "stream", req.params.stream); // Get provider-specific extras for Responses API - let responses_extras = req.provider_extras.get(&ProviderFormat::Responses); + let responses_extras = req.params.extras.get(&ProviderFormat::Responses); // Convert tools to Responses API format if let Some(tools) = req.params.tools.as_ref() { @@ -493,26 +475,29 @@ impl ProviderAdapter for ResponsesAdapter { .unwrap_or_else(|| "completed".to_string()); // Build response with all required fields for TheResponseObject - let mut obj = serde_json::json!({ - "id": format!("resp_{}", PLACEHOLDER_ID), - "object": "response", - "model": resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL), - "output": output, - "output_text": output_text, - "status": status, - "created_at": 0.0, - "tool_choice": "none", - "tools": [], - "parallel_tool_calls": false - }); + let mut map = serde_json::Map::new(); + map.insert( + "id".into(), + Value::String(format!("resp_{}", PLACEHOLDER_ID)), + ); + map.insert("object".into(), Value::String("response".into())); + map.insert( + "model".into(), + Value::String(resp.model.as_deref().unwrap_or(PLACEHOLDER_MODEL).into()), + ); + map.insert("output".into(), Value::Array(output)); + map.insert("output_text".into(), Value::String(output_text)); + map.insert("status".into(), Value::String(status)); + map.insert("created_at".into(), serde_json::json!(0.0)); + map.insert("tool_choice".into(), Value::String("none".into())); + map.insert("tools".into(), Value::Array(vec![])); + map.insert("parallel_tool_calls".into(), Value::Bool(false)); if let Some(usage) = &resp.usage { - obj.as_object_mut() - .unwrap() - .insert("usage".into(), usage.to_provider_value(self.format())); + 
map.insert("usage".into(), usage.to_provider_value(self.format())); } - Ok(obj) + Ok(Value::Object(map)) } // ========================================================================= diff --git a/crates/lingua/src/universal/reasoning.rs b/crates/lingua/src/universal/reasoning.rs index 749722bb..f5a309c5 100644 --- a/crates/lingua/src/universal/reasoning.rs +++ b/crates/lingua/src/universal/reasoning.rs @@ -97,8 +97,20 @@ pub const ANTHROPIC_THINKING_TEMPERATURE: f64 = 1.0; /// - high: 75% of max_tokens /// /// Result is clamped to minimum of 1024 tokens (Anthropic requirement). +/// +/// # Parameters +/// - `effort`: The reasoning effort level +/// - `max_tokens`: Maximum tokens (must be positive, uses DEFAULT_MAX_TOKENS if None/invalid) +/// +/// # Validation +/// - If `max_tokens` is None, zero, or negative, uses `DEFAULT_MAX_TOKENS` (4096) pub fn effort_to_budget(effort: ReasoningEffort, max_tokens: Option) -> i64 { - let max = max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); + // Validate max_tokens - must be strictly positive + let max = match max_tokens { + Some(value) if value > 0 => value, + _ => DEFAULT_MAX_TOKENS, // Use default for None, zero, or negative + }; + let multiplier = match effort { ReasoningEffort::Low => EFFORT_LOW_MULTIPLIER, ReasoningEffort::Medium => EFFORT_MEDIUM_MULTIPLIER, @@ -114,8 +126,26 @@ pub fn effort_to_budget(effort: ReasoningEffort, max_tokens: Option) -> i64 /// - ratio < 0.35: low /// - 0.35 <= ratio < 0.65: medium /// - ratio >= 0.65: high +/// +/// # Parameters +/// - `budget`: Token budget (must be positive, returns default effort if <= 0) +/// - `max_tokens`: Maximum tokens (must be positive, uses DEFAULT_MAX_TOKENS if None/invalid) +/// +/// # Validation +/// - If `max_tokens` is None, zero, or negative, uses `DEFAULT_MAX_TOKENS` (4096) +/// - If `budget` is zero or negative, returns `DEFAULT_REASONING_EFFORT` (Medium) pub fn budget_to_effort(budget: i64, max_tokens: Option) -> ReasoningEffort { - let max = max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); + // Validate max_tokens - must be strictly positive + let max = match max_tokens { + Some(value) if value > 0 => value, + _ => DEFAULT_MAX_TOKENS, // Use default for None, zero, or negative + }; + + // Validate budget - if invalid, return default effort + if budget <= 0 { + return DEFAULT_REASONING_EFFORT; + } + let ratio = budget as f64 / max as f64; if ratio < EFFORT_LOW_THRESHOLD { @@ -524,4 +554,84 @@ mod tests { .unwrap(); assert!(result.is_none()); } + + #[test] + fn test_budget_to_effort_edge_cases() { + let test_cases = vec![ + // (budget, max_tokens, expected_effort, description) + ( + 2048, + Some(0), + ReasoningEffort::Medium, + "zero max_tokens uses DEFAULT", + ), + ( + 1200, + Some(-100), + ReasoningEffort::Low, + "negative max_tokens uses DEFAULT (1200/4096=0.29<0.35)", + ), + ( + 0, + Some(4096), + DEFAULT_REASONING_EFFORT, + "zero budget returns default", + ), + ( + -1000, + Some(4096), + DEFAULT_REASONING_EFFORT, + "negative budget returns default", + ), + ( + -500, + Some(-200), + DEFAULT_REASONING_EFFORT, + "both negative returns default", + ), + ]; + + for (budget, max_tokens, expected, description) in test_cases { + assert_eq!( + budget_to_effort(budget, max_tokens), + expected, + "Failed: {}", + description + ); + } + } + + #[test] + fn test_effort_to_budget_edge_cases() { + let test_cases = vec![ + // (effort, max_tokens, expected_budget, description) + ( + ReasoningEffort::Medium, + Some(0), + 2048, + "zero max_tokens uses DEFAULT (4096*0.5)", + ), + ( + ReasoningEffort::High, + 
Some(-1000), + 3072, + "negative max_tokens uses DEFAULT (4096*0.75)", + ), + ( + ReasoningEffort::Low, + Some(-50), + 1024, + "negative max_tokens clamped to minimum", + ), + ]; + + for (effort, max_tokens, expected, description) in test_cases { + assert_eq!( + effort_to_budget(effort, max_tokens), + expected, + "Failed: {}", + description + ); + } + } } diff --git a/crates/lingua/src/universal/request.rs b/crates/lingua/src/universal/request.rs index b2afc6b8..1bd22d58 100644 --- a/crates/lingua/src/universal/request.rs +++ b/crates/lingua/src/universal/request.rs @@ -7,7 +7,7 @@ converted to/from any provider format. ## Design principles 1. **Round-trip preservation**: Provider-specific fields are stored in - `provider_extras` keyed by `ProviderFormat`, and restored when converting + `params.extras` keyed by `ProviderFormat`, and restored when converting back to the same provider format. 2. **Canonical naming**: Uses consistent field names (e.g., `max_tokens`, `top_p`) @@ -19,6 +19,14 @@ converted to/from any provider format. 4. **Provider isolation**: Provider-specific extras are scoped by `ProviderFormat` to prevent cross-provider contamination (e.g., OpenAI extras don't bleed into Anthropic requests). + +## Provider API references + +- **OpenAI Chat**: +- **OpenAI Responses**: +- **Anthropic**: +- **Google**: +- **Bedrock**: */ use std::collections::HashMap; @@ -36,8 +44,6 @@ use crate::universal::tools::UniversalTool; /// Universal request envelope for LLM API calls. /// /// This type captures the common structure across all provider request formats. -/// Provider-specific fields are stored in `provider_extras`, keyed by the source -/// provider format to prevent cross-provider contamination. #[derive(Debug, Clone, Serialize)] pub struct UniversalRequest { /// Model identifier (may be None for providers that use endpoint-based model selection) @@ -46,105 +52,126 @@ pub struct UniversalRequest { /// Conversation messages in universal format pub messages: Vec, - /// Common request parameters (canonical fields only) + /// Request parameters (canonical fields + provider-specific extras) pub params: UniversalParams, - - /// Provider-specific fields, keyed by the source ProviderFormat. - /// - /// When transforming back to the same provider, these extras are merged back. - /// When transforming to a different provider, they are ignored (no cross-pollination). - /// - /// Example: OpenAI Chat extras stay in `provider_extras[ProviderFormat::OpenAI]` - /// and are only merged back when converting to OpenAI Chat, not to Anthropic. - #[serde(skip)] - pub provider_extras: HashMap>, } /// Common request parameters across providers. /// /// Uses canonical names - adapters handle mapping to provider-specific names. -/// This struct contains ONLY canonical fields - no extras or provider-specific baggage. +/// Provider-specific fields without canonical mappings are stored in `extras`. #[derive(Debug, Clone, Default, Serialize)] pub struct UniversalParams { // === Sampling parameters === - /// Sampling temperature (0.0 to 2.0 typically) + /// Controls randomness: 0 = deterministic, 2 = maximum randomness. + /// + /// **Providers:** OpenAI, Anthropic, Google (`generationConfig.temperature`), Bedrock (`inferenceConfig.temperature`) pub temperature: Option, - /// Nucleus sampling probability + /// Nucleus sampling: only consider tokens with cumulative probability ≤ top_p. 
+ /// + /// **Providers:** OpenAI, Anthropic, Google (`generationConfig.topP`), Bedrock (`inferenceConfig.topP`) pub top_p: Option, - /// Top-k sampling (not supported by all providers) + /// Only sample from the top K most likely tokens. + /// + /// **Providers:** Anthropic, Google (`generationConfig.topK`) pub top_k: Option, - /// Random seed for deterministic generation + /// Random seed for deterministic generation. + /// + /// **Providers:** OpenAI pub seed: Option, - /// Presence penalty (-2.0 to 2.0) + /// Penalize tokens based on whether they've appeared at all (-2.0 to 2.0). + /// + /// **Providers:** OpenAI pub presence_penalty: Option, - /// Frequency penalty (-2.0 to 2.0) + /// Penalize tokens based on how often they've appeared (-2.0 to 2.0). + /// + /// **Providers:** OpenAI pub frequency_penalty: Option, // === Output control === - /// Maximum tokens to generate + /// Maximum tokens to generate in the response. + /// + /// **Providers:** OpenAI (`max_completion_tokens`), Anthropic, Google (`generationConfig.maxOutputTokens`), Bedrock (`inferenceConfig.maxTokens`) pub max_tokens: Option, - /// Stop sequences for generation termination. + /// Sequences that stop generation when encountered. /// - /// All providers accept arrays of strings. OpenAI also accepts a single string, - /// but we normalize to arrays for simplicity - OpenAI accepts both forms. + /// **Providers:** OpenAI, Anthropic (`stop_sequences`), Google (`generationConfig.stopSequences`), Bedrock (`inferenceConfig.stopSequences`) pub stop: Option>, - /// Whether to return log probabilities (OpenAI-specific but canonical) + /// Return log probabilities of output tokens. + /// + /// **Providers:** OpenAI pub logprobs: Option, - /// Number of top logprobs to return (0-20) + /// Number of most likely tokens to return log probabilities for (0-20). + /// + /// **Providers:** OpenAI pub top_logprobs: Option, // === Tools and function calling === - /// Tool definitions in universal format. + /// Tool/function definitions the model can call. /// - /// Tools are normalized to `UniversalTool` which handles the different formats: - /// - Anthropic: `{"name", "description", "input_schema"}` for custom, `{"type": "bash_20250124"}` for builtins - /// - OpenAI Chat: `{"type": "function", "function": {...}}` - /// - OpenAI Responses: `{"type": "function", "name", ...}` or `{"type": "code_interpreter"}` + /// **Providers:** OpenAI, Anthropic, Google (`tools[].functionDeclarations`), Bedrock (`toolConfig.tools[].toolSpec`) pub tools: Option>, - /// Tool selection strategy configuration. + /// How the model should choose which tool to call. /// - /// Uses canonical fields (`mode`, `tool_name`) for cross-provider conversion. + /// **Providers:** OpenAI, Anthropic pub tool_choice: Option, - /// Whether tools can be called in parallel + /// Allow multiple tool calls in a single response. + /// + /// **Providers:** OpenAI, Anthropic (`tool_choice.disable_parallel_tool_use`) pub parallel_tool_calls: Option, // === Response format === - /// Response format configuration. + /// Constrain output format (text, JSON, or JSON schema). /// - /// Uses canonical fields (`format_type`, `json_schema`) for cross-provider conversion. + /// **Providers:** OpenAI, Anthropic (`output_format`) pub response_format: Option, // === Reasoning / Extended thinking === - /// Reasoning configuration for extended thinking / chain-of-thought. + /// Enable extended thinking / chain-of-thought reasoning. 
/// - /// Uses canonical fields (`effort`, `budget_tokens`) for cross-provider conversion. - /// Skipped when disabled or empty to normalize `{enabled: false}` to `null`. + /// **Providers:** OpenAI (`reasoning_effort`), Anthropic (`thinking`), Google (`generationConfig.thinkingConfig`), Bedrock (`additionalModelRequestFields.thinking`) #[serde(skip_serializing_if = "reasoning_should_skip")] pub reasoning: Option, // === Metadata and identification === - /// Request metadata (user tracking, experiment tags, etc.) + /// Key-value metadata attached to the request. + /// + /// **Providers:** OpenAI, Anthropic (only `user_id`) pub metadata: Option, - /// Whether to store completion for training/evals (OpenAI-specific but canonical) + /// Store the completion for later use in fine-tuning or evals. + /// + /// **Providers:** OpenAI pub store: Option, - /// Service tier preference + /// Request priority tier (e.g., "auto", "default"). + /// + /// **Providers:** OpenAI, Anthropic pub service_tier: Option, // === Streaming === - /// Whether to stream the response + /// Stream the response as server-sent events. + /// + /// **Providers:** OpenAI, Anthropic pub stream: Option, + + // === Provider-specific extras === + /// Provider-specific parameters without canonical mappings. + /// + /// Keyed by source `ProviderFormat` - only restored when converting back to + /// the same provider (no cross-provider contamination). + #[serde(skip)] + pub extras: HashMap>, } // ============================================================================= diff --git a/crates/lingua/src/universal/response.rs b/crates/lingua/src/universal/response.rs index a22a656d..42d63ac8 100644 --- a/crates/lingua/src/universal/response.rs +++ b/crates/lingua/src/universal/response.rs @@ -286,75 +286,75 @@ impl UniversalUsage { match provider { // OpenAI, Mistral, and Unknown use OpenAI format ProviderFormat::OpenAI | ProviderFormat::Mistral | ProviderFormat::Unknown => { - let mut obj = serde_json::json!({ - "prompt_tokens": prompt, - "completion_tokens": completion, - "total_tokens": prompt + completion - }); - let obj_map = obj.as_object_mut().unwrap(); + let mut map = serde_json::Map::new(); + map.insert("prompt_tokens".into(), serde_json::json!(prompt)); + map.insert("completion_tokens".into(), serde_json::json!(completion)); + map.insert( + "total_tokens".into(), + serde_json::json!(prompt + completion), + ); if let Some(cached_tokens) = self.prompt_cached_tokens { - obj_map.insert( + map.insert( "prompt_tokens_details".into(), serde_json::json!({ "cached_tokens": cached_tokens }), ); } if let Some(reasoning_tokens) = self.completion_reasoning_tokens { - obj_map.insert( + map.insert( "completion_tokens_details".into(), serde_json::json!({ "reasoning_tokens": reasoning_tokens }), ); } - obj + Value::Object(map) } ProviderFormat::Responses => { - let mut obj = serde_json::json!({ - "input_tokens": prompt, - "output_tokens": completion, - "total_tokens": prompt + completion - }); - let obj_map = obj.as_object_mut().unwrap(); + let mut map = serde_json::Map::new(); + map.insert("input_tokens".into(), serde_json::json!(prompt)); + map.insert("output_tokens".into(), serde_json::json!(completion)); + map.insert( + "total_tokens".into(), + serde_json::json!(prompt + completion), + ); if let Some(cached_tokens) = self.prompt_cached_tokens { - obj_map.insert( + map.insert( "input_tokens_details".into(), serde_json::json!({ "cached_tokens": cached_tokens }), ); } if let Some(reasoning_tokens) = self.completion_reasoning_tokens { - 
obj_map.insert( + map.insert( "output_tokens_details".into(), serde_json::json!({ "reasoning_tokens": reasoning_tokens }), ); } - obj + Value::Object(map) } ProviderFormat::Anthropic => { - let mut obj = serde_json::json!({ - "input_tokens": prompt, - "output_tokens": completion - }); - let obj_map = obj.as_object_mut().unwrap(); + let mut map = serde_json::Map::new(); + map.insert("input_tokens".into(), serde_json::json!(prompt)); + map.insert("output_tokens".into(), serde_json::json!(completion)); if let Some(cache_creation) = self.prompt_cache_creation_tokens { - obj_map.insert( + map.insert( "cache_creation_input_tokens".into(), serde_json::json!(cache_creation), ); } if let Some(cache_read) = self.prompt_cached_tokens { - obj_map.insert( + map.insert( "cache_read_input_tokens".into(), serde_json::json!(cache_read), ); } - obj + Value::Object(map) } ProviderFormat::Converse => serde_json::json!({ "inputTokens": prompt, diff --git a/crates/lingua/src/universal/tools.rs b/crates/lingua/src/universal/tools.rs index 2a7a3e4e..2840538a 100644 --- a/crates/lingua/src/universal/tools.rs +++ b/crates/lingua/src/universal/tools.rs @@ -50,6 +50,10 @@ pub struct UniversalTool { #[serde(skip_serializing_if = "Option::is_none")] pub parameters: Option, + /// Whether to enforce strict schema validation (OpenAI Responses API) + #[serde(skip_serializing_if = "Option::is_none")] + pub strict: Option, + /// Tool type classification #[serde(flatten)] pub tool_type: UniversalToolType, @@ -87,11 +91,13 @@ impl UniversalTool { name: impl Into, description: Option, parameters: Option, + strict: Option, ) -> Self { Self { name: name.into(), description, parameters, + strict, tool_type: UniversalToolType::Function, } } @@ -107,6 +113,7 @@ impl UniversalTool { name: name.into(), description: None, parameters: None, + strict: None, tool_type: UniversalToolType::Builtin { provider: provider.into(), builtin_type: builtin_type.into(), @@ -165,15 +172,16 @@ impl UniversalTool { } } - // Custom tool format: {"name", "description", "input_schema"} + // Custom tool format: {"name", "description", "input_schema", "strict"} let name = value.get("name").and_then(Value::as_str)?; let description = value .get("description") .and_then(Value::as_str) .map(String::from); let parameters = value.get("input_schema").cloned(); + let strict = value.get("strict").and_then(Value::as_bool); - Some(Self::function(name, description, parameters)) + Some(Self::function(name, description, parameters, strict)) } /// Parse a tool from OpenAI Chat Completions format (JSON Value). @@ -192,8 +200,9 @@ impl UniversalTool { .and_then(Value::as_str) .map(String::from); let parameters = func.get("parameters").cloned(); + let strict = func.get("strict").and_then(Value::as_bool); - Some(Self::function(name, description, parameters)) + Some(Self::function(name, description, parameters, strict)) } /// Parse a tool from OpenAI Responses API format (JSON Value). 
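As a quick illustration of the new `strict` plumbing in UniversalTool, the sketch below (not part of the patch) builds a function tool with strict validation enabled and serializes it for the Responses API. It assumes only the four-argument `UniversalTool::function` constructor and the `to_responses_value` method shown in this diff, and it assumes the type is reachable at `lingua::universal::tools::UniversalTool`:

    // Sketch: round-trip the optional `strict` flag introduced in this patch.
    // The import path is an assumption; adjust to wherever UniversalTool is exported.
    use lingua::universal::tools::UniversalTool;
    use serde_json::json;

    fn strict_example() -> serde_json::Value {
        let tool = UniversalTool::function(
            "get_weather",
            Some("Get the current weather".to_string()),
            Some(json!({
                "type": "object",
                "properties": { "location": { "type": "string" } },
                "required": ["location"]
            })),
            Some(true), // strict explicitly enabled
        );

        // With strict = Some(true) the serialized tool carries "strict": true;
        // with None the key is omitted entirely, matching the tests added below.
        tool.to_responses_value()
            .expect("function tools serialize without error")
    }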
@@ -212,8 +221,9 @@ impl UniversalTool { .and_then(Value::as_str) .map(String::from); let parameters = value.get("parameters").cloned(); + let strict = value.get("strict").and_then(Value::as_bool); - Some(Self::function(name, description, parameters)) + Some(Self::function(name, description, parameters, strict)) } "code_interpreter" | "web_search_preview" @@ -281,6 +291,10 @@ impl UniversalTool { self.parameters.clone().unwrap_or_else(|| json!({})), ); + if let Some(strict) = self.strict { + obj.insert("strict".into(), Value::Bool(strict)); + } + Ok(Value::Object(obj)) } UniversalToolType::Builtin { @@ -323,6 +337,10 @@ impl UniversalTool { self.parameters.clone().unwrap_or_else(|| json!({})), ); + if let Some(strict) = self.strict { + func.insert("strict".into(), Value::Bool(strict)); + } + Ok(json!({ "type": "function", "function": Value::Object(func) @@ -357,8 +375,9 @@ impl UniversalTool { self.parameters.clone().unwrap_or_else(|| json!({})), ); - // Responses API function tools have strict: false by default - obj.insert("strict".into(), Value::Bool(false)); + if let Some(strict) = self.strict { + obj.insert("strict".into(), Value::Bool(strict)); + } Ok(Value::Object(obj)) } @@ -507,6 +526,7 @@ mod tests { "get_weather", Some("Get the weather".to_string()), Some(json!({"type": "object"})), + None, ); assert_eq!(tool.name, "get_weather"); @@ -514,6 +534,7 @@ mod tests { assert!(tool.is_function()); assert!(!tool.is_builtin()); assert!(tool.builtin_provider().is_none()); + assert_eq!(tool.strict, None); } #[test] @@ -620,6 +641,7 @@ mod tests { "get_weather", Some("Get weather".to_string()), Some(json!({"type": "object"})), + None, ); let value = tool.to_anthropic_value().unwrap(); @@ -662,6 +684,7 @@ mod tests { "get_weather", Some("Get weather".to_string()), Some(json!({"type": "object"})), + None, ); let value = tool.to_openai_chat_value().unwrap(); @@ -685,6 +708,7 @@ mod tests { "get_weather", Some("Get weather".to_string()), Some(json!({"type": "object"})), + None, ); let value = tool.to_responses_value().unwrap(); @@ -692,7 +716,23 @@ mod tests { assert_eq!(value["type"], "function"); assert_eq!(value["name"], "get_weather"); assert_eq!(value["description"], "Get weather"); - assert_eq!(value["strict"], false); + assert!(value.get("strict").is_none()); // strict only output when explicitly set + } + + #[test] + fn test_universal_tool_to_responses_function_with_strict() { + let tool = UniversalTool::function( + "get_weather", + Some("Get weather".to_string()), + Some(json!({"type": "object"})), + Some(true), + ); + + let value = tool.to_responses_value().unwrap(); + + assert_eq!(value["type"], "function"); + assert_eq!(value["name"], "get_weather"); + assert_eq!(value["strict"], true); } #[test] @@ -785,8 +825,8 @@ mod tests { #[test] fn test_batch_conversion_to_anthropic() { let tools = vec![ - UniversalTool::function("tool1", Some("desc1".to_string()), None), - UniversalTool::function("tool2", Some("desc2".to_string()), None), + UniversalTool::function("tool1", Some("desc1".to_string()), None, None), + UniversalTool::function("tool2", Some("desc2".to_string()), None, None), ]; let result = tools_to_anthropic_value(&tools).unwrap(); @@ -800,7 +840,7 @@ mod tests { #[test] fn test_batch_conversion_to_anthropic_fails_on_wrong_provider() { let tools = vec![ - UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::function("tool1", Some("desc1".to_string()), None, None), UniversalTool::builtin( "code_interpreter", "openai_responses", @@ -816,8 +856,8 @@ 
mod tests { #[test] fn test_batch_conversion_to_openai_chat() { let tools = vec![ - UniversalTool::function("tool1", Some("desc1".to_string()), None), - UniversalTool::function("tool2", Some("desc2".to_string()), None), + UniversalTool::function("tool1", Some("desc1".to_string()), None, None), + UniversalTool::function("tool2", Some("desc2".to_string()), None, None), ]; let result = tools_to_openai_chat_value(&tools).unwrap(); @@ -830,7 +870,7 @@ mod tests { #[test] fn test_batch_conversion_to_openai_chat_fails_on_builtin() { let tools = vec![ - UniversalTool::function("tool1", Some("desc1".to_string()), None), + UniversalTool::function("tool1", Some("desc1".to_string()), None, None), UniversalTool::builtin("bash", "anthropic", "bash_20250124", Some(json!({}))), ]; From f1340cbcc805b1ede43035063eb10f2af8826d0a Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Wed, 28 Jan 2026 11:07:26 -0500 Subject: [PATCH 3/5] add proxy test cases --- payloads/cases/index.ts | 6 +- payloads/cases/proxy.ts | 1584 +++++++++++++++++ payloads/cases/types.ts | 16 + payloads/cases/utils.ts | 17 + payloads/scripts/providers/anthropic.ts | 12 +- payloads/scripts/providers/bedrock.ts | 6 + payloads/scripts/providers/google.ts | 6 + .../scripts/providers/openai-responses.ts | 12 +- payloads/scripts/providers/openai.ts | 12 +- payloads/scripts/validation/index.ts | 122 ++ 10 files changed, 1789 insertions(+), 4 deletions(-) create mode 100644 payloads/cases/proxy.ts diff --git a/payloads/cases/index.ts b/payloads/cases/index.ts index 49087574..9a654b26 100644 --- a/payloads/cases/index.ts +++ b/payloads/cases/index.ts @@ -7,18 +7,21 @@ export * from "./models"; export { simpleCases } from "./simple"; export { advancedCases } from "./advanced"; export { paramsCases } from "./params"; +export { proxyCases } from "./proxy"; // Import and merge all collections for convenience import { simpleCases } from "./simple"; import { advancedCases } from "./advanced"; import { paramsCases } from "./params"; +import { proxyCases } from "./proxy"; import { mergeCollections, getCaseNames } from "./utils"; // Combined collection of all test cases export const allTestCases = mergeCollections( simpleCases, advancedCases, - paramsCases + paramsCases, + proxyCases ); // Map of collection names to their case names (for --cases flag) @@ -26,6 +29,7 @@ export const caseCollections: Record = { simple: getCaseNames(simpleCases), advanced: getCaseNames(advancedCases), params: getCaseNames(paramsCases), + proxy: getCaseNames(proxyCases), }; // Legacy export for backward compatibility (can be removed later) diff --git a/payloads/cases/proxy.ts b/payloads/cases/proxy.ts new file mode 100644 index 00000000..20aa6144 --- /dev/null +++ b/payloads/cases/proxy.ts @@ -0,0 +1,1584 @@ +/** + * Test cases ported from proxy integration tests. + * These test OpenAI chat-completions compatibility with various providers. 
+ */ + +import OpenAI from "openai"; +import { TestCaseCollection } from "./types"; +import { ANTHROPIC_MODEL } from "./models"; + +// Text file: "Hello world!\n" +const TEXT_BASE64 = "SGVsbG8gd29ybGQhCg=="; + +// Minimal WAV header for audio error test (triggers unsupported media type) +const AUDIO_BASE64 = + "UklGRiQAAABXQVZFZm10IBAAAAABAAEARKwAAIhYAQACABAAZGF0YQAAAAA="; + +// Minimal MP4 for video error test (triggers unsupported media type) +const VIDEO_BASE64 = "AAAAIGZ0eXBpc29tAAACAGlzb21pc28yYXZjMW1wNDE="; + +// Small valid PDF (minimal structure) +const PDF_BASE64 = + "JVBERi0xLjQKMSAwIG9iago8PC9UeXBlL0NhdGFsb2cvUGFnZXMgMiAwIFI+PgplbmRvYmoKMiAwIG9iago8PC9UeXBlL1BhZ2VzL0tpZHNbMyAwIFJdL0NvdW50IDE+PgplbmRvYmoKMyAwIG9iago8PC9UeXBlL1BhZ2UvTWVkaWFCb3hbMCAwIDYxMiA3OTJdL1BhcmVudCAyIDAgUi9SZXNvdXJjZXM8PD4+Pj4KZW5kb2JqCnhyZWYKMCA0CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNSAwMDAwMCBuIAowMDAwMDAwMDYxIDAwMDAwIG4gCjAwMDAwMDAxMTggMDAwMDAgbiAKdHJhaWxlcgo8PC9TaXplIDQvUm9vdCAxIDAgUj4+CnN0YXJ0eHJlZgoyMTUKJSVFT0YK"; + +// Small 1x1 PNG +const IMAGE_BASE64 = + "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNk+M9QDwADhgGAWjR9awAAAABJRU5ErkJggg=="; + +// Markdown file: "# Title\n\nThis is a paragraph.\n" +const MD_BASE64 = "IyBUaXRsZQoKVGhpcyBpcyBhIHBhcmFncmFwaC4K"; + +// CSV file: "name,age\nAlice,30\nBob,25\n" +const CSV_BASE64 = "bmFtZSxhZ2UKQWxpY2UsMzAKQm9iLDI1Cg=="; + +// Test cases ported from proxy/packages/proxy/src/providers/anthropic.test.ts +export const proxyCases: TestCaseCollection = { + /** + * Basic non-streaming request with system message. + * Tests: Response format with logprobs field, finish_reason, usage. + * From: anthropic.test.ts "should convert OpenAI non-streaming request to Anthropic and back" + */ + proxyAnthropicBasic: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Tell me a short joke about programming." }, + ], + stream: false, + max_tokens: 150, + }, + responses: null, // Not testing responses API + anthropic: { + model: ANTHROPIC_MODEL, + max_tokens: 150, + system: "You are a helpful assistant.", + messages: [ + { role: "user", content: "Tell me a short joke about programming." }, + ], + }, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + object: "chat.completion", + }, + }, + }, + + /** + * Reasoning/thinking with multi-turn conversation. + * Tests: reasoning_effort param, reasoning blocks in response. + * From: anthropic.test.ts "should accept and return reasoning/thinking params" + */ + proxyAnthropicReasoning: { + "chat-completions": { + model: "claude-3-7-sonnet-20250219", + reasoning_effort: "medium", + stream: false, + messages: [ + { + role: "user", + content: "How many rs in 'ferrocarril'", + }, + { + role: "assistant", + content: "There are 4 letter 'r's in the word \"ferrocarril\".", + }, + { + role: "user", + content: "How many e in what you said?", + }, + ], + }, + responses: null, + anthropic: { + model: "claude-3-7-sonnet-20250219", + max_tokens: 16000, + messages: [ + { + role: "user", + content: "How many rs in 'ferrocarril'", + }, + { + role: "assistant", + content: [ + { + type: "thinking", + thinking: + "Let me count: f-e-r-r-o-c-a-r-r-i-l. The 'r' appears at positions 3, 4, 8, 9. 
So 4 total.", + // Signature is required for thinking blocks + signature: "thinking-signature-placeholder", + }, + { + type: "text", + text: "There are 4 letter 'r's in the word \"ferrocarril\".", + }, + ], + }, + { + role: "user", + content: "How many e in what you said?", + }, + ], + }, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * Tool call with max_tokens causing truncation. + * Tests: tool_calls in response, finish_reason handling. + * From: anthropic.test.ts "should handle max_tokens stop reason correctly with tool calls" + */ + proxyAnthropicToolCall: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [ + { + role: "user", + content: + "Use the calculate function to add 2 and 3 together. Explain your reasoning in detail.", + }, + ], + tools: [ + { + type: "function", + function: { + name: "calculate", + description: "Perform a mathematical calculation", + parameters: { + type: "object", + properties: { + operation: { + type: "string", + enum: ["add", "subtract", "multiply", "divide"], + description: "The operation to perform", + }, + a: { type: "number", description: "First operand" }, + b: { type: "number", description: "Second operand" }, + }, + required: ["operation", "a", "b"], + }, + }, + }, + ], + tool_choice: "auto", + max_tokens: 50, // Low to potentially cause truncation + }, + responses: null, + anthropic: { + model: ANTHROPIC_MODEL, + max_tokens: 50, + messages: [ + { + role: "user", + content: + "Use the calculate function to add 2 and 3 together. Explain your reasoning in detail.", + }, + ], + tools: [ + { + name: "calculate", + description: "Perform a mathematical calculation", + input_schema: { + type: "object", + properties: { + operation: { + type: "string", + enum: ["add", "subtract", "multiply", "divide"], + description: "The operation to perform", + }, + a: { type: "number", description: "First operand" }, + b: { type: "number", description: "Second operand" }, + }, + required: ["operation", "a", "b"], + }, + }, + ], + }, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * PDF file content handling. + * Tests: file content part conversion to Anthropic document format. + * From: anthropic.test.ts "should handle file content parts with PDF data" + */ + proxyAnthropicPdfFile: { + "chat-completions": { + model: "claude-3-5-sonnet-20241022", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this PDF?" }, + { + // Using image_url with PDF data URL (Braintrust converts to document) + type: "image_url", + image_url: { + url: `data:application/pdf;base64,${PDF_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 200, + }, + responses: null, + anthropic: { + model: "claude-3-5-sonnet-20241022", + max_tokens: 200, + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this PDF?" }, + { + type: "document", + source: { + type: "base64", + media_type: "application/pdf", + data: PDF_BASE64, + }, + }, + ], + }, + ], + }, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * Image file content handling. + * Tests: image content part handling. 
+ * From: anthropic.test.ts "should handle file content parts with image data" + */ + proxyAnthropicImageFile: { + "chat-completions": { + model: "claude-3-5-sonnet-20241022", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What color is this pixel?" }, + { + type: "image_url", + image_url: { + url: `data:image/png;base64,${IMAGE_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: { + model: "claude-3-5-sonnet-20241022", + max_tokens: 100, + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What color is this pixel?" }, + { + type: "image", + source: { + type: "base64", + media_type: "image/png", + data: IMAGE_BASE64, + }, + }, + ], + }, + ], + }, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * Streaming request. + * Tests: SSE event format, delta structure. + * From: anthropic.test.ts "should convert OpenAI streaming request to Anthropic and back" + */ + proxyAnthropicStreaming: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Say hello in 3 words." }, + ], + stream: true, + max_tokens: 50, + }, + responses: null, + anthropic: { + model: ANTHROPIC_MODEL, + max_tokens: 50, + stream: true, + system: "You are a helpful assistant.", + messages: [{ role: "user", content: "Say hello in 3 words." }], + }, + google: null, + bedrock: null, + expect: { + status: 200, + }, + }, + + // ============================================================ + // Expectation-based tests (skip capture, validated by expectations) + // ============================================================ + + /** + * Audio file error - Anthropic doesn't support audio input. + * Tests: 400 error for unsupported media type. + * From: anthropic.test.ts "should return 400 for unsupported audio file" + */ + proxyAnthropicAudioError: { + "chat-completions": { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this audio?" }, + { + type: "input_audio", + input_audio: { + data: AUDIO_BASE64, + format: "wav", + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + error: { type: "invalid_request_error" }, + }, + }, + + /** + * Video file error - Anthropic doesn't support video input. + * Tests: 400 error for unsupported media type. + * From: anthropic.test.ts "should return 400 for unsupported video file" + */ + proxyAnthropicVideoError: { + "chat-completions": { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this video?" }, + { + type: "image_url", + image_url: { + url: `data:video/mp4;base64,${VIDEO_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + error: { type: "invalid_request_error" }, + }, + }, + + /** + * Max tokens exceeds model limit. + * Tests: 400 error when max_tokens exceeds Anthropic's limit. 
+ * From: anthropic.test.ts "should return 400 when max_tokens exceeds limit" + */ + proxyAnthropicMaxTokensExceeds: { + "chat-completions": { + model: "claude-sonnet-4-5-20250514", + messages: [{ role: "user", content: "Hello" }], + max_tokens: 200000, // Exceeds Anthropic's max + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + }, + }, + + /** + * Reasoning disabled via reasoning_enabled: false. + * Tests: Response should not contain reasoning block. + * From: anthropic.test.ts "should disable reasoning when reasoning_enabled is false" + */ + proxyAnthropicReasoningDisabled: { + // Cast needed: reasoning_enabled is a Braintrust proxy extension + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions + "chat-completions": { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "What is 2+2?" }], + reasoning_enabled: false, + max_tokens: 100, + } as OpenAI.Chat.Completions.ChatCompletionCreateParams, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.reasoning": { exists: false }, + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * JSON object response format. + * Tests: response_format: json_object triggers tool-based workaround. + * From: anthropic.test.ts "should handle json_object response format" + */ + proxyAnthropicJsonObject: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [ + { + role: "user", + content: "Return a JSON object with a greeting field.", + }, + ], + response_format: { type: "json_object" }, + max_tokens: 150, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + /** + * Tool call with tool_choice: required. + * Tests: finish_reason should be "tool_calls". + * From: anthropic.test.ts "should handle tool_choice required" + */ + proxyAnthropicToolCallRequired: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get the weather in San Francisco" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + max_tokens: 150, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].finish_reason": "tool_calls", + "choices[0].message.tool_calls[0].type": "function", + }, + }, + }, + + /** + * Plain text file support. + * Tests: text/plain files are properly handled. + * From: anthropic.test.ts "should handle plain text file" + */ + proxyAnthropicPlainTextFile: { + "chat-completions": { + model: "claude-3-5-sonnet-20241022", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What does this text file say?" }, + { + type: "image_url", + image_url: { + url: `data:text/plain;base64,${TEXT_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Default max_tokens injection. + * Tests: Request without max_tokens still works (proxy injects default). 
+ * From: anthropic.test.ts "should inject default max_tokens" + */ + proxyAnthropicDefaultMaxTokens: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Say hi" }], + // Note: no max_tokens - proxy should inject default + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * OpenAI reasoning_effort on non-reasoning model. + * Tests: gpt-4o-mini doesn't support reasoning_effort. + * From: openai.test.ts "should reject reasoning_effort on non-reasoning model" + */ + proxyOpenAIReasoningDenied: { + "chat-completions": { + model: "gpt-4o-mini", + messages: [{ role: "user", content: "Hello" }], + reasoning_effort: "high", + max_tokens: 50, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + error: { + message: "Unrecognized request argument supplied: reasoning_effort", + }, + }, + }, + + /** + * OpenAI o3-mini with reasoning_effort. + * Tests: o3-mini supports reasoning_effort parameter. + * From: openai.test.ts "should support reasoning_effort on o3-mini" + */ + proxyOpenAIO3MiniReasoning: { + "chat-completions": { + model: "o3-mini-2025-01-31", + messages: [{ role: "user", content: "What is 2+2?" }], + reasoning_effort: "medium", + max_tokens: 1000, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].finish_reason": "stop", + object: "chat.completion", + }, + }, + }, + + // ============================================================ + // Google Provider Tests + // ============================================================ + + /** + * Basic Google request translation. + * Tests: OpenAI format → Google format via proxy. + * From: google.test.ts basic request handling + */ + proxyGoogleBasic: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Say hello in exactly 3 words." }, + ], + max_tokens: 50, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + /** + * Google parameter translation. + * Tests: temperature, top_p, max_tokens → Google format. + * From: google.params.test.ts parameter mapping + */ + proxyGoogleParamTranslation: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Count to 3." }], + temperature: 0.7, + top_p: 0.9, + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Google tool calling. + * Tests: OpenAI tools format → Google function declarations. + * From: google.test.ts tool calling tests + */ + proxyGoogleToolCall: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "What's the weather in Tokyo?" 
}], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather in a location", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "auto", + max_tokens: 200, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.tool_calls[0].type": "function", + }, + }, + }, + + /** + * Google reasoning/thinking config. + * Tests: reasoning_effort → thinkingConfig translation. + * From: google.test.ts reasoning tests + */ + proxyGoogleReasoning: { + "chat-completions": { + model: "gemini-2.5-flash-preview-04-17", + messages: [{ role: "user", content: "What is the square root of 144?" }], + reasoning_effort: "medium", + max_tokens: 500, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Google image content support. + * Tests: image_url handling for Google. + * From: google.test.ts multimodal tests + */ + proxyGoogleImageContent: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you see in this image?" }, + { + type: "image_url", + image_url: { + url: `data:image/png;base64,${IMAGE_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Google audio support (Google DOES support audio unlike Anthropic). + * Tests: audio content handling for Google. + * From: google.test.ts audio support + */ + proxyGoogleAudioSupport: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you hear in this audio?" }, + { + type: "input_audio", + input_audio: { + data: AUDIO_BASE64, + format: "wav", + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Google video support (Google DOES support video unlike Anthropic). + * Tests: video content handling for Google. + * From: google.test.ts video support + */ + proxyGoogleVideoSupport: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you see in this video?" }, + { + type: "image_url", + image_url: { + url: `data:video/mp4;base64,${VIDEO_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Google stop sequences. + * Tests: stop sequences translation. + * From: google.params.test.ts stop sequences + */ + proxyGoogleStopSequences: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Count from 1 to 10." 
}], + stop: ["5", "END"], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + // ============================================================ + // Additional Anthropic Tests + // ============================================================ + + /** + * Markdown file support. + * Tests: text/markdown files are properly handled. + * From: anthropic.test.ts "should handle markdown file" + */ + proxyAnthropicMarkdownFile: { + "chat-completions": { + model: "claude-3-5-sonnet-20241022", + messages: [ + { + role: "user", + content: [ + { + type: "text", + text: "What is the heading in this markdown file?", + }, + { + type: "image_url", + image_url: { + url: `data:text/markdown;base64,${MD_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * CSV file support. + * Tests: text/csv files are properly handled. + * From: anthropic.test.ts "should handle CSV file" + */ + proxyAnthropicCSVFile: { + "chat-completions": { + model: "claude-3-5-sonnet-20241022", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "How many rows are in this CSV file?" }, + { + type: "image_url", + image_url: { + url: `data:text/csv;base64,${CSV_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Tool call with sufficient tokens. + * Tests: finish_reason is "tool_calls" not "length" when tokens are sufficient. + * From: anthropic.test.ts "should handle tool_use stop reason" + */ + proxyAnthropicToolCallSufficientTokens: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get the weather in Paris" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + max_tokens: 500, // Sufficient tokens - should not truncate + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].finish_reason": "tool_calls", + }, + }, + }, + + /** + * Streaming with reasoning. + * Tests: SSE events work correctly with reasoning enabled. + * From: anthropic.test.ts "should stream reasoning content" + */ + proxyAnthropicStreamingReasoning: { + "chat-completions": { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "What is 15 * 17?" }], + reasoning_effort: "low", + stream: true, + max_tokens: 2000, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + }, + }, + + /** + * Multi-turn conversation with tool results. + * Tests: Tool result handling in conversation flow. + * From: anthropic.test.ts "should handle multi-turn with tool results" + */ + proxyAnthropicToolResultConversation: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [ + { role: "user", content: "What's the weather in London?" 
}, + { + role: "assistant", + content: null, + tool_calls: [ + { + id: "call_123", + type: "function", + function: { + name: "get_weather", + arguments: '{"location": "London"}', + }, + }, + ], + }, + { + role: "tool", + tool_call_id: "call_123", + content: "Currently 15°C and cloudy in London.", + }, + ], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + max_tokens: 200, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + /** + * Streaming with tool calls. + * Tests: SSE events work correctly with tool calling. + * From: anthropic.test.ts "should stream tool calls" + */ + proxyAnthropicStreamingToolCall: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get weather in Berlin" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + stream: true, + max_tokens: 200, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + }, + }, + + // ============================================================ + // Additional OpenAI Tests + // ============================================================ + + /** + * OpenAI PDF file handling. + * Tests: OpenAI doesn't support PDFs in chat completions. + * From: openai.test.ts "should reject PDF files" + */ + proxyOpenAIPdfError: { + "chat-completions": { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this PDF?" }, + { + type: "image_url", + image_url: { + url: `data:application/pdf;base64,${PDF_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + }, + }, + + /** + * OpenAI text file handling. + * Tests: OpenAI doesn't support text files like Anthropic does. + * From: openai.test.ts "should reject text files" + */ + proxyOpenAITextFileError: { + "chat-completions": { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this text file?" }, + { + type: "image_url", + image_url: { + url: `data:text/plain;base64,${TEXT_BASE64}`, + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 400, + }, + }, + + /** + * OpenAI structured output with json_schema. + * Tests: response_format with json_schema type. + * From: openai.test.ts "should handle structured output" + */ + proxyOpenAIStructuredOutput: { + "chat-completions": { + model: "gpt-4o", + messages: [ + { role: "user", content: "What is 2+2? Answer with just the number." 
}, + ], + response_format: { + type: "json_schema", + json_schema: { + name: "math_result", + schema: { + type: "object", + properties: { + result: { type: "number" }, + }, + required: ["result"], + }, + }, + }, + max_tokens: 50, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + /** + * OpenAI reasoning_effort with null value. + * Tests: null reasoning_effort should fallback to medium. + * From: openai.test.ts "should fallback to medium when reasoning_effort is null" + */ + proxyOpenAIReasoningEffortNull: { + "chat-completions": { + model: "o3-mini-2025-01-31", + messages: [{ role: "user", content: "What is 5+5?" }], + reasoning_effort: null, + max_tokens: 500, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + // ============================================================ + // Cross-Provider Behavior Tests + // ============================================================ + + /** + * Azure parameter filtering. + * Tests: Braintrust-specific params are filtered for Azure. + * From: azure.test.ts "should filter Braintrust parameters" + */ + proxyAzureParamFiltering: { + // Cast needed: reasoning_enabled/reasoning_budget are Braintrust proxy extensions + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions + "chat-completions": { + model: "azure/gpt-4o", + messages: [{ role: "user", content: "Hello" }], + reasoning_enabled: true, + reasoning_budget: 1000, + max_tokens: 50, + } as OpenAI.Chat.Completions.ChatCompletionCreateParams, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Claude 3.7 model-specific max_tokens default. + * Tests: Claude 3.7 gets 128k default with beta header. + * From: anthropic.test.ts "should use model-specific max_tokens" + */ + proxyModelSpecificDefaults: { + "chat-completions": { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "Hi" }], + // No max_tokens - should get model-specific default + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Anthropic stop sequences. + * Tests: stop sequences are properly translated. + * From: anthropic.test.ts stop sequences handling + */ + proxyAnthropicStopSequences: { + "chat-completions": { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Count from 1 to 10." }], + stop: ["5", "END"], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * OpenAI stop sequences consistency. + * Tests: stop sequences work on native OpenAI. + * From: schema tests for cross-provider consistency + */ + proxyOpenAIStopSequences: { + "chat-completions": { + model: "gpt-4o-mini", + messages: [{ role: "user", content: "Count from 1 to 10." 
}], + stop: ["5", "END"], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + // ============================================================ + // Additional Missing Tests (from proxy test analysis) + // ============================================================ + + /** + * Google response_format: json_object. + * Tests: json_object → generationConfig.response_mime_type: "application/json". + * From: google.params.test.ts "should translate json_object response format" + */ + proxyGoogleJsonObjectFormat: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: "Return a JSON object with a greeting field set to hello.", + }, + ], + response_format: { type: "json_object" }, + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + /** + * Google response_format: json_schema. + * Tests: json_schema → response_mime_type + response_schema translation. + * From: google.params.test.ts "should translate json_schema response format" + */ + proxyGoogleJsonSchemaFormat: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: "What is 10 + 5? Answer with just the number.", + }, + ], + response_format: { + type: "json_schema", + json_schema: { + name: "math_result", + schema: { + type: "object", + properties: { + result: { type: "number" }, + }, + required: ["result"], + }, + }, + }, + max_tokens: 50, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + /** + * Google unsupported parameter filtering. + * Tests: frequency_penalty, presence_penalty are filtered (not sent to Google). + * From: google.params.test.ts "should filter unsupported parameters" + */ + proxyGoogleUnsupportedParamsFilter: { + "chat-completions": { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Say hello." }], + frequency_penalty: 0.5, // Google doesn't support this + presence_penalty: 0.5, // Google doesn't support this + max_tokens: 50, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * OpenAI PDF URL conversion. + * Tests: Remote PDF URL (in image_url format) → proxy fetches and converts to file block. + * From: openai.test.ts "should convert PDF file URL to file block" + * Note: Proxy detects .pdf extension and converts to native file format. + */ + proxyOpenAIPdfUrlConversion: { + "chat-completions": { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What type of document is this?" }, + { + // Proxy detects PDF URLs in image_url and converts to file block + type: "image_url", + image_url: { + // Using a small, publicly available PDF + url: "https://www.w3.org/WAI/WCAG21/Techniques/pdf/img/table-word.pdf", + }, + }, + ], + }, + ], + max_tokens: 100, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + }, + }, + }, + + /** + * Anthropic claude-3-7 128k output beta header. 
+ * Tests: claude-3-7 without max_tokens gets 128k default and beta header. + * From: anthropic.test.ts "should use 128k max_tokens and beta header for claude-3-7" + * Note: Different from proxyModelSpecificDefaults - this tests with high output expectation. + */ + proxyAnthropic128kBetaHeader: { + "chat-completions": { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: "Write a very short poem (2 lines) about coding.", + }, + ], + // No max_tokens - proxy should inject 128000 and add beta header + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + object: "chat.completion", + }, + }, + }, + + /** + * OpenAI o3-mini streaming with reasoning. + * Tests: o3-mini streaming returns reasoning content in delta. + * From: openai.test.ts "should accept reasoning with o3-mini (streaming)" + */ + proxyOpenAIO3MiniStreamingReasoning: { + "chat-completions": { + model: "o3-mini-2025-01-31", + messages: [{ role: "user", content: "What is 7 * 8?" }], + reasoning_effort: "medium", + stream: true, + max_tokens: 1000, + }, + responses: null, + anthropic: null, + google: null, + bedrock: null, + expect: { + status: 200, + }, + }, +}; diff --git a/payloads/cases/types.ts b/payloads/cases/types.ts index 5f35be68..4f10cfab 100644 --- a/payloads/cases/types.ts +++ b/payloads/cases/types.ts @@ -21,6 +21,20 @@ export type AnthropicMessageCreateParams = output_format?: Anthropic.Beta.Messages.BetaJSONOutputFormat | null; }; +// Expectation-based validation for proxy compatibility tests +// When present, capture.ts skips the case and validate.ts checks expectations +export interface TestExpectation { + // Expected HTTP status code + status?: number; + // Expected field values using dot notation paths (e.g., "choices[0].logprobs") + fields?: Record; + // Expected error response shape + error?: { + type?: string; + message?: string; + }; +} + // Well-defined types for test cases export interface TestCase { "chat-completions": OpenAI.Chat.Completions.ChatCompletionCreateParams | null; @@ -28,6 +42,8 @@ export interface TestCase { anthropic: AnthropicMessageCreateParams | null; google: GoogleGenerateContentRequest | null; bedrock: BedrockConverseRequest | null; + // Optional expectations for proxy compatibility tests + expect?: TestExpectation; } // Collection of test cases organized by name diff --git a/payloads/cases/utils.ts b/payloads/cases/utils.ts index 938f2faa..4d1ce322 100644 --- a/payloads/cases/utils.ts +++ b/payloads/cases/utils.ts @@ -47,3 +47,20 @@ export function mergeCollections( return { ...merged, ...collection }; }, {}); } + +// Helper to get the full test case (including expect field) +export function getFullTestCase( + collection: TestCaseCollection, + caseName: string +): TestCase | undefined { + return collection[caseName]; +} + +// Helper to check if a test case has expectations (should skip capture) +export function hasExpectation( + collection: TestCaseCollection, + caseName: string +): boolean { + const testCase = collection[caseName]; + return testCase?.expect !== undefined; +} diff --git a/payloads/scripts/providers/anthropic.ts b/payloads/scripts/providers/anthropic.ts index 4aef4923..a8e783c7 100644 --- a/payloads/scripts/providers/anthropic.ts +++ b/payloads/scripts/providers/anthropic.ts @@ -1,8 +1,14 @@ import Anthropic from "@anthropic-ai/sdk"; import { CaptureResult, ExecuteOptions, ProviderExecutor } from 
"../types"; -import { allTestCases, getCaseNames, getCaseForProvider } from "../../cases"; +import { + allTestCases, + getCaseNames, + getCaseForProvider, + hasExpectation, +} from "../../cases"; // Anthropic cases - extracted from unified cases +// Skips cases with expectations (those are validated, not captured) export const anthropicCases: Record< string, Anthropic.Messages.MessageCreateParams @@ -10,6 +16,10 @@ export const anthropicCases: Record< // Populate cases from unified structure getCaseNames(allTestCases).forEach((caseName) => { + // Skip cases with expectations - they use validate.ts, not capture.ts + if (hasExpectation(allTestCases, caseName)) { + return; + } const caseData = getCaseForProvider(allTestCases, caseName, "anthropic"); if (caseData) { anthropicCases[caseName] = caseData; diff --git a/payloads/scripts/providers/bedrock.ts b/payloads/scripts/providers/bedrock.ts index 2b5bf034..92c7b891 100644 --- a/payloads/scripts/providers/bedrock.ts +++ b/payloads/scripts/providers/bedrock.ts @@ -11,14 +11,20 @@ import { allTestCases, getCaseNames, getCaseForProvider, + hasExpectation, BedrockConverseRequest, } from "../../cases"; // Bedrock cases - extracted from unified cases +// Skips cases with expectations (those are validated, not captured) export const bedrockCases: Record = {}; // Populate cases from unified structure getCaseNames(allTestCases).forEach((caseName) => { + // Skip cases with expectations - they use validate.ts, not capture.ts + if (hasExpectation(allTestCases, caseName)) { + return; + } const caseData = getCaseForProvider(allTestCases, caseName, "bedrock"); if (caseData) { bedrockCases[caseName] = caseData; diff --git a/payloads/scripts/providers/google.ts b/payloads/scripts/providers/google.ts index 521dcdf5..e176ff33 100644 --- a/payloads/scripts/providers/google.ts +++ b/payloads/scripts/providers/google.ts @@ -5,15 +5,21 @@ import { allTestCases, getCaseNames, getCaseForProvider, + hasExpectation, GoogleGenerateContentRequest, GOOGLE_MODEL, } from "../../cases"; // Google cases - extracted from unified cases +// Skips cases with expectations (those are validated, not captured) export const googleCases: Record = {}; // Populate cases from unified structure getCaseNames(allTestCases).forEach((caseName) => { + // Skip cases with expectations - they use validate.ts, not capture.ts + if (hasExpectation(allTestCases, caseName)) { + return; + } const caseData = getCaseForProvider(allTestCases, caseName, "google"); if (caseData) { googleCases[caseName] = caseData; diff --git a/payloads/scripts/providers/openai-responses.ts b/payloads/scripts/providers/openai-responses.ts index 8c507dbe..c6fe9ae2 100644 --- a/payloads/scripts/providers/openai-responses.ts +++ b/payloads/scripts/providers/openai-responses.ts @@ -1,12 +1,18 @@ import OpenAI from "openai"; import { CaptureResult, ExecuteOptions, ProviderExecutor } from "../types"; -import { allTestCases, getCaseNames, getCaseForProvider } from "../../cases"; +import { + allTestCases, + getCaseNames, + getCaseForProvider, + hasExpectation, +} from "../../cases"; import { ResponseInputItem, ResponseStreamEvent, } from "openai/resources/responses/responses"; // OpenAI Responses API cases - extracted from unified cases +// Skips cases with expectations (those are validated, not captured) export const openaiResponsesCases: Record< string, OpenAI.Responses.ResponseCreateParams @@ -14,6 +20,10 @@ export const openaiResponsesCases: Record< // Populate cases from unified structure 
getCaseNames(allTestCases).forEach((caseName) => { + // Skip cases with expectations - they use validate.ts, not capture.ts + if (hasExpectation(allTestCases, caseName)) { + return; + } const caseData = getCaseForProvider(allTestCases, caseName, "responses"); if (caseData) { openaiResponsesCases[caseName] = caseData; diff --git a/payloads/scripts/providers/openai.ts b/payloads/scripts/providers/openai.ts index 3bca2253..9198ac2f 100644 --- a/payloads/scripts/providers/openai.ts +++ b/payloads/scripts/providers/openai.ts @@ -1,6 +1,11 @@ import OpenAI from "openai"; import { CaptureResult, ExecuteOptions, ProviderExecutor } from "../types"; -import { allTestCases, getCaseNames, getCaseForProvider } from "../../cases"; +import { + allTestCases, + getCaseNames, + getCaseForProvider, + hasExpectation, +} from "../../cases"; // Define specific types for OpenAI type OpenAIRequest = OpenAI.Chat.Completions.ChatCompletionCreateParams; @@ -8,10 +13,15 @@ type OpenAIResponse = OpenAI.Chat.Completions.ChatCompletion; type OpenAIStreamChunk = OpenAI.Chat.Completions.ChatCompletionChunk; // OpenAI Chat Completions cases - extracted from unified cases +// Skips cases with expectations (those are validated, not captured) export const openaiCases: Record = {}; // Populate cases from unified structure getCaseNames(allTestCases).forEach((caseName) => { + // Skip cases with expectations - they use validate.ts, not capture.ts + if (hasExpectation(allTestCases, caseName)) { + return; + } const caseData = getCaseForProvider( allTestCases, caseName, diff --git a/payloads/scripts/validation/index.ts b/payloads/scripts/validation/index.ts index a4755aa5..41e8a5a8 100644 --- a/payloads/scripts/validation/index.ts +++ b/payloads/scripts/validation/index.ts @@ -14,7 +14,9 @@ import { allTestCases, getCaseNames, getCaseForProvider, + getFullTestCase, caseCollections, + TestExpectation, } from "../../cases"; import { OPENAI_CHAT_COMPLETIONS_MODEL, @@ -57,6 +59,74 @@ function isRecord(value: unknown): value is Record { return typeof value === "object" && value !== null && !Array.isArray(value); } +/** + * Get a nested value from an object using dot notation path. + * Supports array indexing like "choices[0].message". + */ +function getPath(obj: unknown, path: string): unknown { + const parts = path.split(/\.|\[|\]/).filter(Boolean); + let current: unknown = obj; + for (const part of parts) { + if (!isRecord(current) && !Array.isArray(current)) { + return undefined; + } + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions + current = (current as Record)[part]; + } + return current; +} + +/** + * Validate response against expectations. + * Returns null if all expectations pass, or an error message if any fail. + */ +function validateExpectations( + expect: TestExpectation, + response: unknown, + httpStatus?: number +): string | null { + // Check HTTP status code + if (expect.status !== undefined && httpStatus !== expect.status) { + return `Expected status ${expect.status}, got ${httpStatus}`; + } + + // Check error fields + if (expect.error && isRecord(response)) { + const errorObj = response.error; + if (!isRecord(errorObj)) { + return `Expected error response, got: ${JSON.stringify(response)}`; + } + if (expect.error.type && errorObj.type !== expect.error.type) { + return `Expected error.type "${expect.error.type}", got "${errorObj.type}"`; + } + if (expect.error.message) { + const actualMessage = String(errorObj.message ?? 
""); + if (!actualMessage.includes(expect.error.message)) { + return `Expected error.message to contain "${expect.error.message}", got "${actualMessage}"`; + } + } + } + + // Check specific fields + if (expect.fields) { + for (const [path, expected] of Object.entries(expect.fields)) { + const actual = getPath(response, path); + // Handle special case: checking existence + if (isRecord(expected) && "exists" in expected) { + const shouldExist = expected.exists; + const doesExist = actual !== undefined; + if (shouldExist !== doesExist) { + return `Expected ${path} to ${shouldExist ? "exist" : "not exist"}`; + } + } else if (actual !== expected) { + return `Expected ${path} = ${JSON.stringify(expected)}, got ${JSON.stringify(actual)}`; + } + } + } + + return null; // All expectations passed +} + /** * Extract model name from actual API response. * Handles both streaming (array) and non-streaming (object) responses. @@ -287,6 +357,58 @@ export async function runValidation( return result; } + // Check if this is an expectation-based test + const fullTestCase = getFullTestCase(allTestCases, caseName); + const expectations = fullTestCase?.expect; + + // For expectation-based tests, use direct HTTP request to get status codes + if (expectations) { + const endpoint = + format === "chat-completions" + ? "/v1/chat/completions" + : "/v1/responses"; + const fetchResponse = await fetch( + `${options.proxyUrl}${endpoint}`, + { + method: "POST", + headers: { + "Content-Type": "application/json", + ...(options.apiKey + ? { Authorization: `Bearer ${options.apiKey}` } + : {}), + }, + body: JSON.stringify(request), + } + ); + + const httpStatus = fetchResponse.status; + let responseBody: unknown; + try { + responseBody = await fetchResponse.json(); + } catch { + responseBody = { error: "Failed to parse response JSON" }; + } + + const validationError = validateExpectations( + expectations, + responseBody, + httpStatus + ); + + const result: ValidationResult = { + format, + caseName, + model: modelName, + success: validationError === null, + durationMs: Date.now() - start, + error: validationError ?? undefined, + actualResponse: options.verbose ? 
responseBody : undefined, + }; + options.onResult?.(result); + return result; + } + + // Standard snapshot-based validation if (!expectedResponse) { const result: ValidationResult = { format, From af4a5958f18c09657a2b8a868b063df90b7c6efb Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Wed, 28 Jan 2026 13:35:13 -0500 Subject: [PATCH 4/5] address proxy edge cases --- crates/braintrust-llm-router/src/error.rs | 8 +- crates/lingua/src/processing/transform.rs | 6 +- .../lingua/src/providers/anthropic/adapter.rs | 8 +- .../lingua/src/providers/anthropic/convert.rs | 55 +- .../lingua/src/providers/anthropic/detect.rs | 8 + .../lingua/src/providers/bedrock/adapter.rs | 9 +- crates/lingua/src/providers/google/adapter.rs | 4 +- crates/lingua/src/providers/openai/adapter.rs | 198 ++- crates/lingua/src/providers/openai/params.rs | 7 + crates/lingua/src/universal/reasoning.rs | 119 +- payloads/cases/index.ts | 11 +- payloads/cases/proxy.ts | 1584 ----------------- payloads/proxy/cases.ts | 915 ++++++++++ payloads/proxy/index.ts | 8 + payloads/proxy/types.ts | 24 + payloads/scripts/validation/index.ts | 410 +++-- 16 files changed, 1555 insertions(+), 1819 deletions(-) delete mode 100644 payloads/cases/proxy.ts create mode 100644 payloads/proxy/cases.ts create mode 100644 payloads/proxy/index.ts create mode 100644 payloads/proxy/types.ts diff --git a/crates/braintrust-llm-router/src/error.rs b/crates/braintrust-llm-router/src/error.rs index bd6e6495..e50e7db6 100644 --- a/crates/braintrust-llm-router/src/error.rs +++ b/crates/braintrust-llm-router/src/error.rs @@ -170,10 +170,12 @@ mod tests { assert!(TransformError::UnsupportedTargetFormat(ProviderFormat::OpenAI).is_client_error()); assert!(TransformError::UnsupportedSourceFormat(ProviderFormat::OpenAI).is_client_error()); - // Server errors + // Conversion errors are client errors (user sent unsupported content) + assert!(TransformError::FromUniversalFailed("test".into()).is_client_error()); + assert!(TransformError::ToUniversalFailed("test".into()).is_client_error()); + + // Server errors (internal issues) assert!(!TransformError::SerializationFailed("test".into()).is_client_error()); - assert!(!TransformError::FromUniversalFailed("test".into()).is_client_error()); - assert!(!TransformError::ToUniversalFailed("test".into()).is_client_error()); assert!(!TransformError::StreamingNotImplemented("test".into()).is_client_error()); } diff --git a/crates/lingua/src/processing/transform.rs b/crates/lingua/src/processing/transform.rs index 6c2e5e5f..6e54fd5c 100644 --- a/crates/lingua/src/processing/transform.rs +++ b/crates/lingua/src/processing/transform.rs @@ -62,7 +62,9 @@ impl TransformError { /// Returns true if this is a client-side error (user's fault). /// /// Client errors indicate invalid input or unsupported configurations - /// that the user should fix in their request. + /// that the user should fix in their request. This includes conversion + /// failures which typically mean the user tried to use features that + /// the target provider doesn't support. 
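+    ///
+    /// Illustrative doc sketch (example only; the same assertion appears in the
+    /// router error tests updated in this patch):
+    ///
+    /// ```ignore
+    /// // A conversion failure is reported to callers as a client error
+    /// // (surfaced as HTTP 400 at the router layer).
+    /// let err = TransformError::FromUniversalFailed(
+    ///     "unsupported content part for target provider".into(),
+    /// );
+    /// assert!(err.is_client_error());
+    /// ```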
pub fn is_client_error(&self) -> bool { matches!( self, @@ -71,6 +73,8 @@ impl TransformError { | TransformError::DeserializationFailed(_) | TransformError::UnsupportedTargetFormat(_) | TransformError::UnsupportedSourceFormat(_) + | TransformError::ToUniversalFailed(_) + | TransformError::FromUniversalFailed(_) ) } } diff --git a/crates/lingua/src/providers/anthropic/adapter.rs b/crates/lingua/src/providers/anthropic/adapter.rs index bde7ec79..66d9b233 100644 --- a/crates/lingua/src/providers/anthropic/adapter.rs +++ b/crates/lingua/src/providers/anthropic/adapter.rs @@ -163,8 +163,14 @@ impl ProviderAdapter for AnthropicAdapter { obj.insert("max_tokens".into(), Value::Number(max_tokens.into())); // Check if reasoning/thinking is enabled (needed for temperature override) + // Note: thinking_val can be { type: "disabled" } or { type: "enabled", ... } + // Only override temperature when type is "enabled" let thinking_val = req.params.reasoning_for(ProviderFormat::Anthropic); - let reasoning_enabled = thinking_val.is_some(); + let reasoning_enabled = thinking_val + .as_ref() + .and_then(|v| v.get("type")) + .and_then(|t| t.as_str()) + .is_some_and(|t| t == "enabled"); // Insert other params // Anthropic requires temperature=1.0 when extended thinking is enabled diff --git a/crates/lingua/src/providers/anthropic/convert.rs b/crates/lingua/src/providers/anthropic/convert.rs index e57b4249..f6050560 100644 --- a/crates/lingua/src/providers/anthropic/convert.rs +++ b/crates/lingua/src/providers/anthropic/convert.rs @@ -6,6 +6,7 @@ use crate::universal::{ TextContentPart, ToolCallArguments, ToolContentPart, ToolResultContentPart, UserContent, UserContentPart, }; +use crate::util::media::parse_base64_data_url; impl TryFromLLM for Message { type Error = ConvertError; @@ -406,6 +407,43 @@ impl TryFromLLM for generated::InputMessage { let is_url = image_data.starts_with("http://") || image_data.starts_with("https://"); + // Handle text content types - decode to text block instead of document + // Anthropic's Document block only accepts PDFs, not text files + if !is_url { + if let Some(mt) = &media_type { + if mt.starts_with("text/") { + // Parse data URL and decode base64 to text + if let Some(media_block) = parse_base64_data_url(&image_data) { + use base64::Engine; + if let Ok(bytes) = base64::engine::general_purpose::STANDARD.decode(&media_block.data) { + if let Ok(text) = String::from_utf8(bytes) { + return Some(generated::InputContentBlock { + cache_control: None, + citations: None, + text: Some(text), + input_content_block_type: generated::InputContentBlockType::Text, + source: None, + context: None, + title: None, + content: None, + signature: None, + thinking: None, + data: None, + id: None, + input: None, + name: None, + is_error: None, + tool_use_id: None, + }); + } + } + } + // Skip if can't decode text + return None; + } + } + } + let (source_type, source_url, source_data, anthropic_media_type) = if is_url { ( generated::FluffyType::Url, @@ -414,7 +452,7 @@ impl TryFromLLM for generated::InputMessage { None, ) } else { - // Base64 data - parse media_type + // Base64 data - parse media_type (images and PDFs only) let anthropic_media_type = media_type.as_ref().and_then(|mt| match mt.as_str() { "image/jpeg" => { @@ -432,9 +470,7 @@ impl TryFromLLM for generated::InputMessage { "application/pdf" => { Some(generated::FluffyMediaType::ApplicationPdf) } - "text/plain" => { - Some(generated::FluffyMediaType::TextPlain) - } + // Text types are handled above, shouldn't reach here _ => None, }); ( @@ 
-445,12 +481,19 @@ impl TryFromLLM for generated::InputMessage { ) }; + // Block type: only PDF uses Document, everything else is Image + let block_type = match anthropic_media_type { + Some(generated::FluffyMediaType::ApplicationPdf) => { + generated::InputContentBlockType::Document + } + _ => generated::InputContentBlockType::Image, + }; + Some(generated::InputContentBlock { cache_control: None, citations: None, text: None, - input_content_block_type: - generated::InputContentBlockType::Image, + input_content_block_type: block_type, source: Some(generated::Source::SourceSource( generated::SourceSource { data: source_data, diff --git a/crates/lingua/src/providers/anthropic/detect.rs b/crates/lingua/src/providers/anthropic/detect.rs index bc101abb..fdc982f6 100644 --- a/crates/lingua/src/providers/anthropic/detect.rs +++ b/crates/lingua/src/providers/anthropic/detect.rs @@ -26,6 +26,14 @@ const OPENAI_ONLY_FIELDS: &[&str] = &[ "service_tier", "store", "parallel_tool_calls", + // OpenAI uses `stop`, Anthropic uses `stop_sequences` + "stop", + // OpenAI reasoning parameter + "reasoning_effort", + // Braintrust extension for disabling reasoning + "reasoning_enabled", + // OpenAI alias for max_tokens + "max_completion_tokens", ]; /// Attempt to parse a JSON Value as Anthropic CreateMessageParams. diff --git a/crates/lingua/src/providers/bedrock/adapter.rs b/crates/lingua/src/providers/bedrock/adapter.rs index 6cd214ac..a1abafe6 100644 --- a/crates/lingua/src/providers/bedrock/adapter.rs +++ b/crates/lingua/src/providers/bedrock/adapter.rs @@ -179,11 +179,18 @@ impl ProviderAdapter for BedrockAdapter { ); // Check if reasoning/thinking is enabled (for temperature override) + // Note: thinking_config can be { type: "disabled" } or { type: "enabled", ... } + // Only override temperature when type is "enabled" let thinking_config = req.params.reasoning_for(ProviderFormat::Converse); + let reasoning_enabled = thinking_config + .as_ref() + .and_then(|v| v.get("type")) + .and_then(|t| t.as_str()) + .is_some_and(|t| t == "enabled"); // Build inferenceConfig if any params are set // Note: Claude on Bedrock requires temperature=1.0 when extended thinking is enabled - let temperature = if thinking_config.is_some() { + let temperature = if reasoning_enabled { Some(ANTHROPIC_THINKING_TEMPERATURE) } else { req.params.temperature diff --git a/crates/lingua/src/providers/google/adapter.rs b/crates/lingua/src/providers/google/adapter.rs index 1a7aee6d..34532470 100644 --- a/crates/lingua/src/providers/google/adapter.rs +++ b/crates/lingua/src/providers/google/adapter.rs @@ -67,9 +67,11 @@ impl ProviderAdapter for GoogleAdapter { if let Some(config) = &typed_params.generation_config { let max_tokens = config.max_output_tokens.map(|t| t as i64); // Convert Google's thinkingConfig to ReasoningConfig + // thinkingBudget: 0 means disabled let reasoning = config.thinking_config.as_ref().map(|tc| { + let is_disabled = tc.thinking_budget == Some(0); crate::universal::ReasoningConfig { - enabled: tc.include_thoughts.or(Some(true)), // If thinking_config exists, it's enabled + enabled: Some(!is_disabled), budget_tokens: tc.thinking_budget.map(|b| b as i64), ..Default::default() } diff --git a/crates/lingua/src/providers/openai/adapter.rs b/crates/lingua/src/providers/openai/adapter.rs index 528a6a34..ce2acb9b 100644 --- a/crates/lingua/src/providers/openai/adapter.rs +++ b/crates/lingua/src/providers/openai/adapter.rs @@ -29,6 +29,8 @@ use crate::providers::openai::try_parse_openai; use crate::serde_json::{self, Map, 
Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::Message; +use crate::universal::reasoning::effort_to_budget; +use crate::universal::request::{ReasoningConfig, ReasoningEffort}; use crate::universal::tools::{tools_to_openai_chat_value, UniversalTool}; use crate::universal::{ parse_stop_sequences, UniversalParams, UniversalRequest, UniversalResponse, @@ -89,10 +91,14 @@ impl ProviderAdapter for OpenAIAdapter { .max_tokens .or(typed_params.max_completion_tokens); - // Convert reasoning effort to ReasoningConfig, computing budget_tokens with max_tokens context - let reasoning = typed_params - .reasoning_effort - .map(|effort| (effort, max_tokens).into()); + // Build ReasoningConfig from all reasoning-related fields + // Priority: reasoning_enabled: false takes precedence, then reasoning_budget, then reasoning_effort + let reasoning = build_reasoning_config( + typed_params.reasoning_enabled, + typed_params.reasoning_budget, + typed_params.reasoning_effort, + max_tokens, + ); // Build canonical params from typed fields let mut params = UniversalParams { @@ -510,6 +516,61 @@ impl ProviderAdapter for OpenAIAdapter { } } +// ============================================================================= +// Helper Functions +// ============================================================================= + +use crate::providers::openai::generated::ReasoningEffort as OpenAIReasoningEffort; + +/// Build ReasoningConfig from OpenAI reasoning-related fields. +/// +/// Priority: +/// - `reasoning_enabled: false` OR `reasoning_budget: 0` → disabled +/// - `reasoning_budget: N` (N > 0) → enabled with explicit budget +/// - `reasoning_effort` → enabled with computed budget from effort level +/// - `reasoning_enabled: true` (without budget/effort) → enabled with default +fn build_reasoning_config( + reasoning_enabled: Option, + reasoning_budget: Option, + reasoning_effort: Option, + max_tokens: Option, +) -> Option { + // Check if any reasoning field is set + if reasoning_enabled.is_none() && reasoning_budget.is_none() && reasoning_effort.is_none() { + return None; + } + + // Determine if reasoning is disabled + // reasoning_enabled: false OR reasoning_budget: 0 means disabled + let is_disabled = reasoning_enabled == Some(false) || reasoning_budget == Some(0); + + if is_disabled { + return Some(ReasoningConfig { + enabled: Some(false), + budget_tokens: None, + ..Default::default() + }); + } + + // Calculate budget_tokens: reasoning_budget takes precedence over reasoning_effort + let budget_tokens = reasoning_budget.or_else(|| { + reasoning_effort.map(|effort| { + let universal_effort = match effort { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + effort_to_budget(universal_effort, max_tokens) + }) + }); + + Some(ReasoningConfig { + enabled: Some(true), + budget_tokens, + ..Default::default() + }) +} + // ============================================================================= // OpenAI Target-Specific Transformations // ============================================================================= @@ -1047,4 +1108,133 @@ mod tests { _ => panic!("Expected Assistant message, got {:?}", msg), } } + + // ========================================================================= + // Braintrust reasoning extension tests + // ========================================================================= + + #[test] + fn 
test_build_reasoning_config_disabled() { + // reasoning_enabled: false should result in disabled + let config = build_reasoning_config(Some(false), None, None, None); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(false)); + } + + #[test] + fn test_build_reasoning_config_budget_zero_disabled() { + // reasoning_budget: 0 should result in disabled + let config = build_reasoning_config(None, Some(0), None, None); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(false)); + } + + #[test] + fn test_build_reasoning_config_budget_positive() { + // reasoning_budget: 2000 should result in enabled with explicit budget + let config = build_reasoning_config(None, Some(2000), None, None); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(true)); + assert_eq!(config.budget_tokens, Some(2000)); + } + + #[test] + fn test_build_reasoning_config_effort_only() { + // reasoning_effort: high should result in enabled with computed budget + let config = + build_reasoning_config(None, None, Some(OpenAIReasoningEffort::High), Some(4096)); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(true)); + assert_eq!(config.budget_tokens, Some(3072)); // 75% of 4096 + } + + #[test] + fn test_build_reasoning_config_budget_overrides_effort() { + // reasoning_budget should take precedence over reasoning_effort + let config = build_reasoning_config( + None, + Some(5000), + Some(OpenAIReasoningEffort::Low), + Some(4096), + ); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(true)); + assert_eq!(config.budget_tokens, Some(5000)); // Not the computed effort budget + } + + #[test] + fn test_build_reasoning_config_enabled_true_budget_zero_disabled() { + // reasoning_enabled: true with reasoning_budget: 0 should still be disabled + // (budget: 0 takes precedence) + let config = build_reasoning_config(Some(true), Some(0), None, None); + assert!(config.is_some()); + let config = config.unwrap(); + assert_eq!(config.enabled, Some(false)); + } + + #[test] + fn test_build_reasoning_config_none() { + // No reasoning fields should result in None + let config = build_reasoning_config(None, None, None, None); + assert!(config.is_none()); + } + + #[test] + fn test_openai_reasoning_enabled_false_to_anthropic() { + // Full integration test: OpenAI request with reasoning_enabled: false + // should produce Anthropic { type: "disabled" } + let adapter = OpenAIAdapter; + let payload = json!({ + "model": "claude-3-7-sonnet-20250219", + "messages": [{"role": "user", "content": "Hello"}], + "reasoning_enabled": false, + "max_tokens": 100 + }); + + let universal = adapter.request_to_universal(payload).unwrap(); + + // Verify ReasoningConfig has enabled: false + assert!(universal.params.reasoning.is_some()); + let reasoning = universal.params.reasoning.as_ref().unwrap(); + assert_eq!(reasoning.enabled, Some(false)); + + // Verify the output for Anthropic + let anthropic_thinking = universal.params.reasoning_for(ProviderFormat::Anthropic); + assert!(anthropic_thinking.is_some()); + let thinking = anthropic_thinking.unwrap(); + assert_eq!(thinking.get("type").unwrap(), "disabled"); + } + + #[test] + fn test_openai_reasoning_budget_to_anthropic() { + // Full integration test: OpenAI request with reasoning_budget + // should produce Anthropic { type: "enabled", budget_tokens: N } + let adapter = OpenAIAdapter; + let payload = 
json!({ + "model": "claude-3-7-sonnet-20250219", + "messages": [{"role": "user", "content": "Hello"}], + "reasoning_budget": 3000, + "max_tokens": 100 + }); + + let universal = adapter.request_to_universal(payload).unwrap(); + + // Verify ReasoningConfig + assert!(universal.params.reasoning.is_some()); + let reasoning = universal.params.reasoning.as_ref().unwrap(); + assert_eq!(reasoning.enabled, Some(true)); + assert_eq!(reasoning.budget_tokens, Some(3000)); + + // Verify the output for Anthropic + let anthropic_thinking = universal.params.reasoning_for(ProviderFormat::Anthropic); + assert!(anthropic_thinking.is_some()); + let thinking = anthropic_thinking.unwrap(); + assert_eq!(thinking.get("type").unwrap(), "enabled"); + assert_eq!(thinking.get("budget_tokens").unwrap(), 3000); + } } diff --git a/crates/lingua/src/providers/openai/params.rs b/crates/lingua/src/providers/openai/params.rs index bb7e85ed..5c499846 100644 --- a/crates/lingua/src/providers/openai/params.rs +++ b/crates/lingua/src/providers/openai/params.rs @@ -53,6 +53,13 @@ pub struct OpenAIChatParams { // === Reasoning (o-series models) === pub reasoning_effort: Option, + // === Reasoning (Braintrust proxy extensions) === + /// Explicitly enable/disable reasoning (Braintrust proxy extension) + pub reasoning_enabled: Option, + + /// Token budget for reasoning (Braintrust proxy extension) + pub reasoning_budget: Option, + // === Metadata and identification === pub metadata: Option, pub store: Option, diff --git a/crates/lingua/src/universal/reasoning.rs b/crates/lingua/src/universal/reasoning.rs index f5a309c5..ebf4ed68 100644 --- a/crates/lingua/src/universal/reasoning.rs +++ b/crates/lingua/src/universal/reasoning.rs @@ -364,33 +364,49 @@ fn to_openai_responses(config: &ReasoningConfig, max_tokens: Option) -> Opt } /// Convert ReasoningConfig to Anthropic `thinking` object. +/// +/// Returns: +/// - `Some({ type: "disabled" })` when explicitly disabled +/// - `Some({ type: "enabled", budget_tokens: N })` when enabled +/// - `None` when not specified (no thinking field) fn to_anthropic(config: &ReasoningConfig, _max_tokens: Option) -> Option { - if config.enabled != Some(true) { - return None; + match config.enabled { + // Explicitly disabled - return disabled payload + Some(false) => Some(json!({ "type": "disabled" })), + // Enabled - return enabled payload with budget + Some(true) => { + let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + Some(json!({ + "type": "enabled", + "budget_tokens": budget + })) + } + // Not specified - no thinking field + None => None, } - - // Use budget_tokens or default minimum - let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); - - Some(json!({ - "type": "enabled", - "budget_tokens": budget - })) } /// Convert ReasoningConfig to Google `thinkingConfig` object. 
+/// +/// Returns: +/// - `Some({ thinkingBudget: 0 })` when explicitly disabled +/// - `Some({ includeThoughts: true, thinkingBudget: N })` when enabled +/// - `None` when not specified (no thinkingConfig field) fn to_google(config: &ReasoningConfig, _max_tokens: Option) -> Option { - if config.enabled != Some(true) { - return None; + match config.enabled { + // Explicitly disabled - return disabled payload + Some(false) => Some(json!({ "thinkingBudget": 0 })), + // Enabled - return enabled payload with budget + Some(true) => { + let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + Some(json!({ + "includeThoughts": true, + "thinkingBudget": budget + })) + } + // Not specified - no thinkingConfig field + None => None, } - - // Use budget_tokens or default minimum - let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); - - Some(json!({ - "includeThoughts": true, - "thinkingBudget": budget - })) } #[cfg(test)] @@ -544,6 +560,7 @@ mod tests { #[test] fn test_to_bedrock_thinking_disabled() { + // When explicitly disabled, should return { type: "disabled" } let config = ReasoningConfig { enabled: Some(false), ..Default::default() @@ -551,6 +568,68 @@ mod tests { let result = config .to_provider(ProviderFormat::Converse, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(result.get("type").unwrap(), "disabled"); + } + + #[test] + fn test_to_anthropic_thinking_disabled() { + // When explicitly disabled, should return { type: "disabled" } + let config = ReasoningConfig { + enabled: Some(false), + ..Default::default() + }; + + let result = config + .to_provider(ProviderFormat::Anthropic, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(result.get("type").unwrap(), "disabled"); + } + + #[test] + fn test_to_anthropic_thinking_not_specified() { + // When not specified (enabled: None), should return None + let config = ReasoningConfig { + enabled: None, + budget_tokens: None, + ..Default::default() + }; + + let result = config + .to_provider(ProviderFormat::Anthropic, Some(4096)) + .unwrap(); + assert!(result.is_none()); + } + + #[test] + fn test_to_google_thinking_disabled() { + // When explicitly disabled, should return { thinkingBudget: 0 } + let config = ReasoningConfig { + enabled: Some(false), + ..Default::default() + }; + + let result = config + .to_provider(ProviderFormat::Google, Some(4096)) + .unwrap() + .unwrap(); + assert_eq!(result.get("thinkingBudget").unwrap(), 0); + assert!(result.get("includeThoughts").is_none()); + } + + #[test] + fn test_to_google_thinking_not_specified() { + // When not specified (enabled: None), should return None + let config = ReasoningConfig { + enabled: None, + budget_tokens: None, + ..Default::default() + }; + + let result = config + .to_provider(ProviderFormat::Google, Some(4096)) .unwrap(); assert!(result.is_none()); } diff --git a/payloads/cases/index.ts b/payloads/cases/index.ts index 9a654b26..cd6d8533 100644 --- a/payloads/cases/index.ts +++ b/payloads/cases/index.ts @@ -3,33 +3,30 @@ export * from "./types"; export * from "./utils"; export * from "./models"; -// Export all case collections +// Export all case collections (snapshot-based cases only) export { simpleCases } from "./simple"; export { advancedCases } from "./advanced"; export { paramsCases } from "./params"; -export { proxyCases } from "./proxy"; // Import and merge all collections for convenience import { simpleCases } from "./simple"; import { advancedCases } from "./advanced"; import { paramsCases } from "./params"; -import { proxyCases } from "./proxy"; import 
{ mergeCollections, getCaseNames } from "./utils"; -// Combined collection of all test cases +// Combined collection of all snapshot-based test cases export const allTestCases = mergeCollections( simpleCases, advancedCases, - paramsCases, - proxyCases + paramsCases ); // Map of collection names to their case names (for --cases flag) +// Note: proxy cases are handled separately in the validation library export const caseCollections: Record = { simple: getCaseNames(simpleCases), advanced: getCaseNames(advancedCases), params: getCaseNames(paramsCases), - proxy: getCaseNames(proxyCases), }; // Legacy export for backward compatibility (can be removed later) diff --git a/payloads/cases/proxy.ts b/payloads/cases/proxy.ts deleted file mode 100644 index 20aa6144..00000000 --- a/payloads/cases/proxy.ts +++ /dev/null @@ -1,1584 +0,0 @@ -/** - * Test cases ported from proxy integration tests. - * These test OpenAI chat-completions compatibility with various providers. - */ - -import OpenAI from "openai"; -import { TestCaseCollection } from "./types"; -import { ANTHROPIC_MODEL } from "./models"; - -// Text file: "Hello world!\n" -const TEXT_BASE64 = "SGVsbG8gd29ybGQhCg=="; - -// Minimal WAV header for audio error test (triggers unsupported media type) -const AUDIO_BASE64 = - "UklGRiQAAABXQVZFZm10IBAAAAABAAEARKwAAIhYAQACABAAZGF0YQAAAAA="; - -// Minimal MP4 for video error test (triggers unsupported media type) -const VIDEO_BASE64 = "AAAAIGZ0eXBpc29tAAACAGlzb21pc28yYXZjMW1wNDE="; - -// Small valid PDF (minimal structure) -const PDF_BASE64 = - "JVBERi0xLjQKMSAwIG9iago8PC9UeXBlL0NhdGFsb2cvUGFnZXMgMiAwIFI+PgplbmRvYmoKMiAwIG9iago8PC9UeXBlL1BhZ2VzL0tpZHNbMyAwIFJdL0NvdW50IDE+PgplbmRvYmoKMyAwIG9iago8PC9UeXBlL1BhZ2UvTWVkaWFCb3hbMCAwIDYxMiA3OTJdL1BhcmVudCAyIDAgUi9SZXNvdXJjZXM8PD4+Pj4KZW5kb2JqCnhyZWYKMCA0CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNSAwMDAwMCBuIAowMDAwMDAwMDYxIDAwMDAwIG4gCjAwMDAwMDAxMTggMDAwMDAgbiAKdHJhaWxlcgo8PC9TaXplIDQvUm9vdCAxIDAgUj4+CnN0YXJ0eHJlZgoyMTUKJSVFT0YK"; - -// Small 1x1 PNG -const IMAGE_BASE64 = - "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNk+M9QDwADhgGAWjR9awAAAABJRU5ErkJggg=="; - -// Markdown file: "# Title\n\nThis is a paragraph.\n" -const MD_BASE64 = "IyBUaXRsZQoKVGhpcyBpcyBhIHBhcmFncmFwaC4K"; - -// CSV file: "name,age\nAlice,30\nBob,25\n" -const CSV_BASE64 = "bmFtZSxhZ2UKQWxpY2UsMzAKQm9iLDI1Cg=="; - -// Test cases ported from proxy/packages/proxy/src/providers/anthropic.test.ts -export const proxyCases: TestCaseCollection = { - /** - * Basic non-streaming request with system message. - * Tests: Response format with logprobs field, finish_reason, usage. - * From: anthropic.test.ts "should convert OpenAI non-streaming request to Anthropic and back" - */ - proxyAnthropicBasic: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [ - { role: "system", content: "You are a helpful assistant." }, - { role: "user", content: "Tell me a short joke about programming." }, - ], - stream: false, - max_tokens: 150, - }, - responses: null, // Not testing responses API - anthropic: { - model: ANTHROPIC_MODEL, - max_tokens: 150, - system: "You are a helpful assistant.", - messages: [ - { role: "user", content: "Tell me a short joke about programming." }, - ], - }, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - object: "chat.completion", - }, - }, - }, - - /** - * Reasoning/thinking with multi-turn conversation. 
- * Tests: reasoning_effort param, reasoning blocks in response. - * From: anthropic.test.ts "should accept and return reasoning/thinking params" - */ - proxyAnthropicReasoning: { - "chat-completions": { - model: "claude-3-7-sonnet-20250219", - reasoning_effort: "medium", - stream: false, - messages: [ - { - role: "user", - content: "How many rs in 'ferrocarril'", - }, - { - role: "assistant", - content: "There are 4 letter 'r's in the word \"ferrocarril\".", - }, - { - role: "user", - content: "How many e in what you said?", - }, - ], - }, - responses: null, - anthropic: { - model: "claude-3-7-sonnet-20250219", - max_tokens: 16000, - messages: [ - { - role: "user", - content: "How many rs in 'ferrocarril'", - }, - { - role: "assistant", - content: [ - { - type: "thinking", - thinking: - "Let me count: f-e-r-r-o-c-a-r-r-i-l. The 'r' appears at positions 3, 4, 8, 9. So 4 total.", - // Signature is required for thinking blocks - signature: "thinking-signature-placeholder", - }, - { - type: "text", - text: "There are 4 letter 'r's in the word \"ferrocarril\".", - }, - ], - }, - { - role: "user", - content: "How many e in what you said?", - }, - ], - }, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * Tool call with max_tokens causing truncation. - * Tests: tool_calls in response, finish_reason handling. - * From: anthropic.test.ts "should handle max_tokens stop reason correctly with tool calls" - */ - proxyAnthropicToolCall: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [ - { - role: "user", - content: - "Use the calculate function to add 2 and 3 together. Explain your reasoning in detail.", - }, - ], - tools: [ - { - type: "function", - function: { - name: "calculate", - description: "Perform a mathematical calculation", - parameters: { - type: "object", - properties: { - operation: { - type: "string", - enum: ["add", "subtract", "multiply", "divide"], - description: "The operation to perform", - }, - a: { type: "number", description: "First operand" }, - b: { type: "number", description: "Second operand" }, - }, - required: ["operation", "a", "b"], - }, - }, - }, - ], - tool_choice: "auto", - max_tokens: 50, // Low to potentially cause truncation - }, - responses: null, - anthropic: { - model: ANTHROPIC_MODEL, - max_tokens: 50, - messages: [ - { - role: "user", - content: - "Use the calculate function to add 2 and 3 together. Explain your reasoning in detail.", - }, - ], - tools: [ - { - name: "calculate", - description: "Perform a mathematical calculation", - input_schema: { - type: "object", - properties: { - operation: { - type: "string", - enum: ["add", "subtract", "multiply", "divide"], - description: "The operation to perform", - }, - a: { type: "number", description: "First operand" }, - b: { type: "number", description: "Second operand" }, - }, - required: ["operation", "a", "b"], - }, - }, - ], - }, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * PDF file content handling. - * Tests: file content part conversion to Anthropic document format. - * From: anthropic.test.ts "should handle file content parts with PDF data" - */ - proxyAnthropicPdfFile: { - "chat-completions": { - model: "claude-3-5-sonnet-20241022", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this PDF?" 
}, - { - // Using image_url with PDF data URL (Braintrust converts to document) - type: "image_url", - image_url: { - url: `data:application/pdf;base64,${PDF_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 200, - }, - responses: null, - anthropic: { - model: "claude-3-5-sonnet-20241022", - max_tokens: 200, - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this PDF?" }, - { - type: "document", - source: { - type: "base64", - media_type: "application/pdf", - data: PDF_BASE64, - }, - }, - ], - }, - ], - }, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * Image file content handling. - * Tests: image content part handling. - * From: anthropic.test.ts "should handle file content parts with image data" - */ - proxyAnthropicImageFile: { - "chat-completions": { - model: "claude-3-5-sonnet-20241022", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What color is this pixel?" }, - { - type: "image_url", - image_url: { - url: `data:image/png;base64,${IMAGE_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: { - model: "claude-3-5-sonnet-20241022", - max_tokens: 100, - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What color is this pixel?" }, - { - type: "image", - source: { - type: "base64", - media_type: "image/png", - data: IMAGE_BASE64, - }, - }, - ], - }, - ], - }, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * Streaming request. - * Tests: SSE event format, delta structure. - * From: anthropic.test.ts "should convert OpenAI streaming request to Anthropic and back" - */ - proxyAnthropicStreaming: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [ - { role: "system", content: "You are a helpful assistant." }, - { role: "user", content: "Say hello in 3 words." }, - ], - stream: true, - max_tokens: 50, - }, - responses: null, - anthropic: { - model: ANTHROPIC_MODEL, - max_tokens: 50, - stream: true, - system: "You are a helpful assistant.", - messages: [{ role: "user", content: "Say hello in 3 words." }], - }, - google: null, - bedrock: null, - expect: { - status: 200, - }, - }, - - // ============================================================ - // Expectation-based tests (skip capture, validated by expectations) - // ============================================================ - - /** - * Audio file error - Anthropic doesn't support audio input. - * Tests: 400 error for unsupported media type. - * From: anthropic.test.ts "should return 400 for unsupported audio file" - */ - proxyAnthropicAudioError: { - "chat-completions": { - model: "claude-3-7-sonnet-latest", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this audio?" }, - { - type: "input_audio", - input_audio: { - data: AUDIO_BASE64, - format: "wav", - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - error: { type: "invalid_request_error" }, - }, - }, - - /** - * Video file error - Anthropic doesn't support video input. - * Tests: 400 error for unsupported media type. 
- * From: anthropic.test.ts "should return 400 for unsupported video file" - */ - proxyAnthropicVideoError: { - "chat-completions": { - model: "claude-3-7-sonnet-latest", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this video?" }, - { - type: "image_url", - image_url: { - url: `data:video/mp4;base64,${VIDEO_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - error: { type: "invalid_request_error" }, - }, - }, - - /** - * Max tokens exceeds model limit. - * Tests: 400 error when max_tokens exceeds Anthropic's limit. - * From: anthropic.test.ts "should return 400 when max_tokens exceeds limit" - */ - proxyAnthropicMaxTokensExceeds: { - "chat-completions": { - model: "claude-sonnet-4-5-20250514", - messages: [{ role: "user", content: "Hello" }], - max_tokens: 200000, // Exceeds Anthropic's max - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - }, - }, - - /** - * Reasoning disabled via reasoning_enabled: false. - * Tests: Response should not contain reasoning block. - * From: anthropic.test.ts "should disable reasoning when reasoning_enabled is false" - */ - proxyAnthropicReasoningDisabled: { - // Cast needed: reasoning_enabled is a Braintrust proxy extension - // eslint-disable-next-line @typescript-eslint/consistent-type-assertions - "chat-completions": { - model: "claude-3-7-sonnet-20250219", - messages: [{ role: "user", content: "What is 2+2?" }], - reasoning_enabled: false, - max_tokens: 100, - } as OpenAI.Chat.Completions.ChatCompletionCreateParams, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.reasoning": { exists: false }, - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * JSON object response format. - * Tests: response_format: json_object triggers tool-based workaround. - * From: anthropic.test.ts "should handle json_object response format" - */ - proxyAnthropicJsonObject: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [ - { - role: "user", - content: "Return a JSON object with a greeting field.", - }, - ], - response_format: { type: "json_object" }, - max_tokens: 150, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - }, - }, - }, - - /** - * Tool call with tool_choice: required. - * Tests: finish_reason should be "tool_calls". - * From: anthropic.test.ts "should handle tool_choice required" - */ - proxyAnthropicToolCallRequired: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [{ role: "user", content: "Get the weather in San Francisco" }], - tools: [ - { - type: "function", - function: { - name: "get_weather", - description: "Get the current weather", - parameters: { - type: "object", - properties: { - location: { type: "string", description: "City name" }, - }, - required: ["location"], - }, - }, - }, - ], - tool_choice: "required", - max_tokens: 150, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].finish_reason": "tool_calls", - "choices[0].message.tool_calls[0].type": "function", - }, - }, - }, - - /** - * Plain text file support. - * Tests: text/plain files are properly handled. 
- * From: anthropic.test.ts "should handle plain text file" - */ - proxyAnthropicPlainTextFile: { - "chat-completions": { - model: "claude-3-5-sonnet-20241022", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What does this text file say?" }, - { - type: "image_url", - image_url: { - url: `data:text/plain;base64,${TEXT_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Default max_tokens injection. - * Tests: Request without max_tokens still works (proxy injects default). - * From: anthropic.test.ts "should inject default max_tokens" - */ - proxyAnthropicDefaultMaxTokens: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [{ role: "user", content: "Say hi" }], - // Note: no max_tokens - proxy should inject default - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * OpenAI reasoning_effort on non-reasoning model. - * Tests: gpt-4o-mini doesn't support reasoning_effort. - * From: openai.test.ts "should reject reasoning_effort on non-reasoning model" - */ - proxyOpenAIReasoningDenied: { - "chat-completions": { - model: "gpt-4o-mini", - messages: [{ role: "user", content: "Hello" }], - reasoning_effort: "high", - max_tokens: 50, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - error: { - message: "Unrecognized request argument supplied: reasoning_effort", - }, - }, - }, - - /** - * OpenAI o3-mini with reasoning_effort. - * Tests: o3-mini supports reasoning_effort parameter. - * From: openai.test.ts "should support reasoning_effort on o3-mini" - */ - proxyOpenAIO3MiniReasoning: { - "chat-completions": { - model: "o3-mini-2025-01-31", - messages: [{ role: "user", content: "What is 2+2?" }], - reasoning_effort: "medium", - max_tokens: 1000, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].finish_reason": "stop", - object: "chat.completion", - }, - }, - }, - - // ============================================================ - // Google Provider Tests - // ============================================================ - - /** - * Basic Google request translation. - * Tests: OpenAI format → Google format via proxy. - * From: google.test.ts basic request handling - */ - proxyGoogleBasic: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { role: "system", content: "You are a helpful assistant." }, - { role: "user", content: "Say hello in exactly 3 words." }, - ], - max_tokens: 50, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - object: "chat.completion", - }, - }, - }, - - /** - * Google parameter translation. - * Tests: temperature, top_p, max_tokens → Google format. - * From: google.params.test.ts parameter mapping - */ - proxyGoogleParamTranslation: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [{ role: "user", content: "Count to 3." 
}], - temperature: 0.7, - top_p: 0.9, - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Google tool calling. - * Tests: OpenAI tools format → Google function declarations. - * From: google.test.ts tool calling tests - */ - proxyGoogleToolCall: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [{ role: "user", content: "What's the weather in Tokyo?" }], - tools: [ - { - type: "function", - function: { - name: "get_weather", - description: "Get the current weather in a location", - parameters: { - type: "object", - properties: { - location: { type: "string", description: "City name" }, - }, - required: ["location"], - }, - }, - }, - ], - tool_choice: "auto", - max_tokens: 200, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.tool_calls[0].type": "function", - }, - }, - }, - - /** - * Google reasoning/thinking config. - * Tests: reasoning_effort → thinkingConfig translation. - * From: google.test.ts reasoning tests - */ - proxyGoogleReasoning: { - "chat-completions": { - model: "gemini-2.5-flash-preview-04-17", - messages: [{ role: "user", content: "What is the square root of 144?" }], - reasoning_effort: "medium", - max_tokens: 500, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Google image content support. - * Tests: image_url handling for Google. - * From: google.test.ts multimodal tests - */ - proxyGoogleImageContent: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What do you see in this image?" }, - { - type: "image_url", - image_url: { - url: `data:image/png;base64,${IMAGE_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Google audio support (Google DOES support audio unlike Anthropic). - * Tests: audio content handling for Google. - * From: google.test.ts audio support - */ - proxyGoogleAudioSupport: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What do you hear in this audio?" }, - { - type: "input_audio", - input_audio: { - data: AUDIO_BASE64, - format: "wav", - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Google video support (Google DOES support video unlike Anthropic). - * Tests: video content handling for Google. - * From: google.test.ts video support - */ - proxyGoogleVideoSupport: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What do you see in this video?" 
}, - { - type: "image_url", - image_url: { - url: `data:video/mp4;base64,${VIDEO_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Google stop sequences. - * Tests: stop sequences translation. - * From: google.params.test.ts stop sequences - */ - proxyGoogleStopSequences: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [{ role: "user", content: "Count from 1 to 10." }], - stop: ["5", "END"], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - // ============================================================ - // Additional Anthropic Tests - // ============================================================ - - /** - * Markdown file support. - * Tests: text/markdown files are properly handled. - * From: anthropic.test.ts "should handle markdown file" - */ - proxyAnthropicMarkdownFile: { - "chat-completions": { - model: "claude-3-5-sonnet-20241022", - messages: [ - { - role: "user", - content: [ - { - type: "text", - text: "What is the heading in this markdown file?", - }, - { - type: "image_url", - image_url: { - url: `data:text/markdown;base64,${MD_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * CSV file support. - * Tests: text/csv files are properly handled. - * From: anthropic.test.ts "should handle CSV file" - */ - proxyAnthropicCSVFile: { - "chat-completions": { - model: "claude-3-5-sonnet-20241022", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "How many rows are in this CSV file?" }, - { - type: "image_url", - image_url: { - url: `data:text/csv;base64,${CSV_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Tool call with sufficient tokens. - * Tests: finish_reason is "tool_calls" not "length" when tokens are sufficient. - * From: anthropic.test.ts "should handle tool_use stop reason" - */ - proxyAnthropicToolCallSufficientTokens: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [{ role: "user", content: "Get the weather in Paris" }], - tools: [ - { - type: "function", - function: { - name: "get_weather", - description: "Get the current weather", - parameters: { - type: "object", - properties: { - location: { type: "string", description: "City name" }, - }, - required: ["location"], - }, - }, - }, - ], - tool_choice: "required", - max_tokens: 500, // Sufficient tokens - should not truncate - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].finish_reason": "tool_calls", - }, - }, - }, - - /** - * Streaming with reasoning. - * Tests: SSE events work correctly with reasoning enabled. - * From: anthropic.test.ts "should stream reasoning content" - */ - proxyAnthropicStreamingReasoning: { - "chat-completions": { - model: "claude-3-7-sonnet-20250219", - messages: [{ role: "user", content: "What is 15 * 17?" 
}], - reasoning_effort: "low", - stream: true, - max_tokens: 2000, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - }, - }, - - /** - * Multi-turn conversation with tool results. - * Tests: Tool result handling in conversation flow. - * From: anthropic.test.ts "should handle multi-turn with tool results" - */ - proxyAnthropicToolResultConversation: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [ - { role: "user", content: "What's the weather in London?" }, - { - role: "assistant", - content: null, - tool_calls: [ - { - id: "call_123", - type: "function", - function: { - name: "get_weather", - arguments: '{"location": "London"}', - }, - }, - ], - }, - { - role: "tool", - tool_call_id: "call_123", - content: "Currently 15°C and cloudy in London.", - }, - ], - tools: [ - { - type: "function", - function: { - name: "get_weather", - description: "Get the current weather", - parameters: { - type: "object", - properties: { - location: { type: "string", description: "City name" }, - }, - required: ["location"], - }, - }, - }, - ], - max_tokens: 200, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - }, - }, - }, - - /** - * Streaming with tool calls. - * Tests: SSE events work correctly with tool calling. - * From: anthropic.test.ts "should stream tool calls" - */ - proxyAnthropicStreamingToolCall: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [{ role: "user", content: "Get weather in Berlin" }], - tools: [ - { - type: "function", - function: { - name: "get_weather", - description: "Get the current weather", - parameters: { - type: "object", - properties: { - location: { type: "string", description: "City name" }, - }, - required: ["location"], - }, - }, - }, - ], - tool_choice: "required", - stream: true, - max_tokens: 200, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - }, - }, - - // ============================================================ - // Additional OpenAI Tests - // ============================================================ - - /** - * OpenAI PDF file handling. - * Tests: OpenAI doesn't support PDFs in chat completions. - * From: openai.test.ts "should reject PDF files" - */ - proxyOpenAIPdfError: { - "chat-completions": { - model: "gpt-4o", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this PDF?" }, - { - type: "image_url", - image_url: { - url: `data:application/pdf;base64,${PDF_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - }, - }, - - /** - * OpenAI text file handling. - * Tests: OpenAI doesn't support text files like Anthropic does. - * From: openai.test.ts "should reject text files" - */ - proxyOpenAITextFileError: { - "chat-completions": { - model: "gpt-4o", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What is in this text file?" }, - { - type: "image_url", - image_url: { - url: `data:text/plain;base64,${TEXT_BASE64}`, - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 400, - }, - }, - - /** - * OpenAI structured output with json_schema. - * Tests: response_format with json_schema type. 
- * From: openai.test.ts "should handle structured output" - */ - proxyOpenAIStructuredOutput: { - "chat-completions": { - model: "gpt-4o", - messages: [ - { role: "user", content: "What is 2+2? Answer with just the number." }, - ], - response_format: { - type: "json_schema", - json_schema: { - name: "math_result", - schema: { - type: "object", - properties: { - result: { type: "number" }, - }, - required: ["result"], - }, - }, - }, - max_tokens: 50, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - }, - }, - }, - - /** - * OpenAI reasoning_effort with null value. - * Tests: null reasoning_effort should fallback to medium. - * From: openai.test.ts "should fallback to medium when reasoning_effort is null" - */ - proxyOpenAIReasoningEffortNull: { - "chat-completions": { - model: "o3-mini-2025-01-31", - messages: [{ role: "user", content: "What is 5+5?" }], - reasoning_effort: null, - max_tokens: 500, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - // ============================================================ - // Cross-Provider Behavior Tests - // ============================================================ - - /** - * Azure parameter filtering. - * Tests: Braintrust-specific params are filtered for Azure. - * From: azure.test.ts "should filter Braintrust parameters" - */ - proxyAzureParamFiltering: { - // Cast needed: reasoning_enabled/reasoning_budget are Braintrust proxy extensions - // eslint-disable-next-line @typescript-eslint/consistent-type-assertions - "chat-completions": { - model: "azure/gpt-4o", - messages: [{ role: "user", content: "Hello" }], - reasoning_enabled: true, - reasoning_budget: 1000, - max_tokens: 50, - } as OpenAI.Chat.Completions.ChatCompletionCreateParams, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Claude 3.7 model-specific max_tokens default. - * Tests: Claude 3.7 gets 128k default with beta header. - * From: anthropic.test.ts "should use model-specific max_tokens" - */ - proxyModelSpecificDefaults: { - "chat-completions": { - model: "claude-3-7-sonnet-20250219", - messages: [{ role: "user", content: "Hi" }], - // No max_tokens - should get model-specific default - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Anthropic stop sequences. - * Tests: stop sequences are properly translated. - * From: anthropic.test.ts stop sequences handling - */ - proxyAnthropicStopSequences: { - "chat-completions": { - model: "claude-3-haiku-20240307", - messages: [{ role: "user", content: "Count from 1 to 10." }], - stop: ["5", "END"], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * OpenAI stop sequences consistency. - * Tests: stop sequences work on native OpenAI. - * From: schema tests for cross-provider consistency - */ - proxyOpenAIStopSequences: { - "chat-completions": { - model: "gpt-4o-mini", - messages: [{ role: "user", content: "Count from 1 to 10." 
}], - stop: ["5", "END"], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - // ============================================================ - // Additional Missing Tests (from proxy test analysis) - // ============================================================ - - /** - * Google response_format: json_object. - * Tests: json_object → generationConfig.response_mime_type: "application/json". - * From: google.params.test.ts "should translate json_object response format" - */ - proxyGoogleJsonObjectFormat: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { - role: "user", - content: "Return a JSON object with a greeting field set to hello.", - }, - ], - response_format: { type: "json_object" }, - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - }, - }, - }, - - /** - * Google response_format: json_schema. - * Tests: json_schema → response_mime_type + response_schema translation. - * From: google.params.test.ts "should translate json_schema response format" - */ - proxyGoogleJsonSchemaFormat: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [ - { - role: "user", - content: "What is 10 + 5? Answer with just the number.", - }, - ], - response_format: { - type: "json_schema", - json_schema: { - name: "math_result", - schema: { - type: "object", - properties: { - result: { type: "number" }, - }, - required: ["result"], - }, - }, - }, - max_tokens: 50, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - }, - }, - }, - - /** - * Google unsupported parameter filtering. - * Tests: frequency_penalty, presence_penalty are filtered (not sent to Google). - * From: google.params.test.ts "should filter unsupported parameters" - */ - proxyGoogleUnsupportedParamsFilter: { - "chat-completions": { - model: "gemini-2.0-flash", - messages: [{ role: "user", content: "Say hello." }], - frequency_penalty: 0.5, // Google doesn't support this - presence_penalty: 0.5, // Google doesn't support this - max_tokens: 50, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * OpenAI PDF URL conversion. - * Tests: Remote PDF URL (in image_url format) → proxy fetches and converts to file block. - * From: openai.test.ts "should convert PDF file URL to file block" - * Note: Proxy detects .pdf extension and converts to native file format. - */ - proxyOpenAIPdfUrlConversion: { - "chat-completions": { - model: "gpt-4o", - messages: [ - { - role: "user", - content: [ - { type: "text", text: "What type of document is this?" }, - { - // Proxy detects PDF URLs in image_url and converts to file block - type: "image_url", - image_url: { - // Using a small, publicly available PDF - url: "https://www.w3.org/WAI/WCAG21/Techniques/pdf/img/table-word.pdf", - }, - }, - ], - }, - ], - max_tokens: 100, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - }, - }, - }, - - /** - * Anthropic claude-3-7 128k output beta header. 
- * Tests: claude-3-7 without max_tokens gets 128k default and beta header. - * From: anthropic.test.ts "should use 128k max_tokens and beta header for claude-3-7" - * Note: Different from proxyModelSpecificDefaults - this tests with high output expectation. - */ - proxyAnthropic128kBetaHeader: { - "chat-completions": { - model: "claude-3-7-sonnet-latest", - messages: [ - { - role: "user", - content: "Write a very short poem (2 lines) about coding.", - }, - ], - // No max_tokens - proxy should inject 128000 and add beta header - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - fields: { - "choices[0].message.role": "assistant", - "choices[0].finish_reason": "stop", - object: "chat.completion", - }, - }, - }, - - /** - * OpenAI o3-mini streaming with reasoning. - * Tests: o3-mini streaming returns reasoning content in delta. - * From: openai.test.ts "should accept reasoning with o3-mini (streaming)" - */ - proxyOpenAIO3MiniStreamingReasoning: { - "chat-completions": { - model: "o3-mini-2025-01-31", - messages: [{ role: "user", content: "What is 7 * 8?" }], - reasoning_effort: "medium", - stream: true, - max_tokens: 1000, - }, - responses: null, - anthropic: null, - google: null, - bedrock: null, - expect: { - status: 200, - }, - }, -}; diff --git a/payloads/proxy/cases.ts b/payloads/proxy/cases.ts new file mode 100644 index 00000000..6bc24911 --- /dev/null +++ b/payloads/proxy/cases.ts @@ -0,0 +1,915 @@ +import OpenAI from "openai"; +import { ProxyTestCaseCollection } from "./types"; + +const TEXT_BASE64 = "SGVsbG8gd29ybGQhCg=="; +const AUDIO_BASE64 = + "UklGRiQAAABXQVZFZm10IBAAAAABAAEARKwAAIhYAQACABAAZGF0YQAAAAA="; +const VIDEO_BASE64 = "AAAAIGZ0eXBpc29tAAACAGlzb21pc28yYXZjMW1wNDE="; +const PDF_BASE64 = + "JVBERi0xLjQKMSAwIG9iago8PC9UeXBlL0NhdGFsb2cvUGFnZXMgMiAwIFI+PgplbmRvYmoKMiAwIG9iago8PC9UeXBlL1BhZ2VzL0tpZHNbMyAwIFJdL0NvdW50IDE+PgplbmRvYmoKMyAwIG9iago8PC9UeXBlL1BhZ2UvTWVkaWFCb3hbMCAwIDYxMiA3OTJdL1BhcmVudCAyIDAgUi9SZXNvdXJjZXM8PD4+Pj4KZW5kb2JqCnhyZWYKMCA0CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNSAwMDAwMCBuIAowMDAwMDAwMDYxIDAwMDAwIG4gCjAwMDAwMDAxMTggMDAwMDAgbiAKdHJhaWxlcgo8PC9TaXplIDQvUm9vdCAxIDAgUj4+CnN0YXJ0eHJlZgoyMTUKJSVFT0YK"; +const IMAGE_BASE64 = + "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNk+M9QDwADhgGAWjR9awAAAABJRU5ErkJggg=="; +const MD_BASE64 = "IyBUaXRsZQoKVGhpcyBpcyBhIHBhcmFncmFwaC4K"; +const CSV_BASE64 = "bmFtZSxhZ2UKQWxpY2UsMzAKQm9iLDI1Cg=="; + +export const proxyCases: ProxyTestCaseCollection = { + proxyAnthropicBasic: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Tell me a short joke about programming." }, + ], + max_tokens: 150, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + object: "chat.completion", + }, + }, + }, + + proxyAnthropicReasoning: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-20250219", + reasoning_effort: "medium", + messages: [ + { role: "user", content: "How many rs in 'ferrocarril'" }, + { + role: "assistant", + content: "There are 4 letter 'r's in the word \"ferrocarril\".", + }, + { role: "user", content: "How many e in what you said?" 
}, + ], + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyAnthropicToolCall: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [ + { + role: "user", + content: + "Use the calculate function to add 2 and 3 together. Explain your reasoning in detail.", + }, + ], + tools: [ + { + type: "function", + function: { + name: "calculate", + description: "Perform a mathematical calculation", + parameters: { + type: "object", + properties: { + operation: { + type: "string", + enum: ["add", "subtract", "multiply", "divide"], + description: "The operation to perform", + }, + a: { type: "number", description: "First operand" }, + b: { type: "number", description: "Second operand" }, + }, + required: ["operation", "a", "b"], + }, + }, + }, + ], + tool_choice: "auto", + max_tokens: 50, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyAnthropicPdfFile: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this PDF?" }, + { + type: "image_url", + image_url: { url: `data:application/pdf;base64,${PDF_BASE64}` }, + }, + ], + }, + ], + max_tokens: 200, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyAnthropicImageFile: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What color is this pixel?" }, + { + type: "image_url", + image_url: { url: `data:image/png;base64,${IMAGE_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyAnthropicStreaming: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Say hello in 3 words." }, + ], + stream: true, + max_tokens: 50, + }, + expect: { status: 200 }, + }, + + proxyAnthropicAudioError: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this audio?" }, + { + type: "input_audio", + input_audio: { data: AUDIO_BASE64, format: "wav" }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 400, error: { type: "invalid_request_error" } }, + }, + + proxyAnthropicVideoError: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this video?" 
}, + { + type: "image_url", + image_url: { url: `data:video/mp4;base64,${VIDEO_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 400, error: { type: "invalid_request_error" } }, + }, + + proxyAnthropicMaxTokensExceeds: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [{ role: "user", content: "Hello" }], + max_tokens: 200000, + }, + expect: { status: 400 }, + }, + + proxyAnthropicReasoningDisabled: { + format: "chat-completions", + // Cast: reasoning_enabled is a Braintrust proxy extension + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions + request: { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "What is 2+2?" }], + reasoning_enabled: false, + max_tokens: 100, + } as OpenAI.Chat.Completions.ChatCompletionCreateParams, + expect: { + status: 200, + fields: { + "choices[0].message.reasoning": { exists: false }, + "choices[0].message.role": "assistant", + }, + }, + }, + + proxyAnthropicJsonObject: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: "Return a JSON object with a greeting field.", + }, + ], + response_format: { type: "json_object" }, + max_tokens: 150, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + proxyAnthropicToolCallRequired: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get the weather in San Francisco" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + max_tokens: 150, + }, + expect: { + status: 200, + fields: { + "choices[0].finish_reason": "tool_calls", + "choices[0].message.tool_calls[0].type": "function", + }, + }, + }, + + proxyAnthropicPlainTextFile: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What does this text file say?" }, + { + type: "image_url", + image_url: { url: `data:text/plain;base64,${TEXT_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropicDefaultMaxTokens: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Say hi" }], + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyOpenAIReasoningDenied: { + format: "chat-completions", + request: { + model: "gpt-4o-mini", + messages: [{ role: "user", content: "Hello" }], + reasoning_effort: "high", + max_tokens: 50, + }, + expect: { + status: 400, + error: { + message: "Unrecognized request argument supplied: reasoning_effort", + }, + }, + }, + + proxyOpenAIO3MiniReasoning: { + format: "chat-completions", + request: { + model: "o3-mini-2025-01-31", + messages: [{ role: "user", content: "What is 2+2?" 
}], + reasoning_effort: "medium", + max_tokens: 1000, + }, + expect: { + status: 200, + fields: { "choices[0].finish_reason": "stop", object: "chat.completion" }, + }, + }, + + proxyGoogleBasic: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { role: "system", content: "You are a helpful assistant." }, + { role: "user", content: "Say hello in exactly 3 words." }, + ], + max_tokens: 50, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + object: "chat.completion", + }, + }, + }, + + proxyGoogleParamTranslation: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Count to 3." }], + temperature: 0.7, + top_p: 0.9, + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleToolCall: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "What's the weather in Tokyo?" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather in a location", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "auto", + max_tokens: 200, + }, + expect: { + status: 200, + fields: { "choices[0].message.tool_calls[0].type": "function" }, + }, + }, + + proxyGoogleReasoning: { + format: "chat-completions", + request: { + model: "gemini-2.5-flash-preview-04-17", + messages: [{ role: "user", content: "What is the square root of 144?" }], + reasoning_effort: "medium", + max_tokens: 500, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleImageContent: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you see in this image?" }, + { + type: "image_url", + image_url: { url: `data:image/png;base64,${IMAGE_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleAudioSupport: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you hear in this audio?" }, + { + type: "input_audio", + input_audio: { data: AUDIO_BASE64, format: "wav" }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleVideoSupport: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What do you see in this video?" }, + { + type: "image_url", + image_url: { url: `data:video/mp4;base64,${VIDEO_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleStopSequences: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Count from 1 to 10." 
}], + stop: ["5", "END"], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropicMarkdownFile: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: [ + { + type: "text", + text: "What is the heading in this markdown file?", + }, + { + type: "image_url", + image_url: { url: `data:text/markdown;base64,${MD_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropicCSVFile: { + format: "chat-completions", + request: { + model: "claude-sonnet-4-5-20250929", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "How many rows are in this CSV file?" }, + { + type: "image_url", + image_url: { url: `data:text/csv;base64,${CSV_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropicToolCallSufficientTokens: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get the weather in Paris" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + max_tokens: 500, + }, + expect: { + status: 200, + fields: { "choices[0].finish_reason": "tool_calls" }, + }, + }, + + proxyAnthropicStreamingReasoning: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "What is 15 * 17?" }], + reasoning_effort: "low", + stream: true, + max_tokens: 2000, + }, + expect: { status: 200 }, + }, + + proxyAnthropicToolResultConversation: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [ + { role: "user", content: "What's the weather in London?" 
}, + { + role: "assistant", + content: null, + tool_calls: [ + { + id: "call_123", + type: "function", + function: { + name: "get_weather", + arguments: '{"location": "London"}', + }, + }, + ], + }, + { + role: "tool", + tool_call_id: "call_123", + content: "Currently 15°C and cloudy in London.", + }, + ], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + max_tokens: 200, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + proxyAnthropicStreamingToolCall: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Get weather in Berlin" }], + tools: [ + { + type: "function", + function: { + name: "get_weather", + description: "Get the current weather", + parameters: { + type: "object", + properties: { + location: { type: "string", description: "City name" }, + }, + required: ["location"], + }, + }, + }, + ], + tool_choice: "required", + stream: true, + max_tokens: 200, + }, + expect: { status: 200 }, + }, + + proxyOpenAIPdfError: { + format: "chat-completions", + request: { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this PDF?" }, + { + type: "image_url", + image_url: { url: `data:application/pdf;base64,${PDF_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 400 }, + }, + + proxyOpenAITextFileError: { + format: "chat-completions", + request: { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What is in this text file?" }, + { + type: "image_url", + image_url: { url: `data:text/plain;base64,${TEXT_BASE64}` }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 400 }, + }, + + proxyOpenAIStructuredOutput: { + format: "chat-completions", + request: { + model: "gpt-4o", + messages: [ + { role: "user", content: "What is 2+2? Answer with just the number." }, + ], + response_format: { + type: "json_schema", + json_schema: { + name: "math_result", + schema: { + type: "object", + properties: { result: { type: "number" } }, + required: ["result"], + }, + }, + }, + max_tokens: 50, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + proxyAzureParamFiltering: { + format: "chat-completions", + // Cast: reasoning_enabled/reasoning_budget are Braintrust proxy extensions + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions + request: { + model: "azure/gpt-4o", + messages: [{ role: "user", content: "Hello" }], + reasoning_enabled: true, + reasoning_budget: 1000, + max_tokens: 50, + } as OpenAI.Chat.Completions.ChatCompletionCreateParams, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyModelSpecificDefaults: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-20250219", + messages: [{ role: "user", content: "Hi" }], + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropicStopSequences: { + format: "chat-completions", + request: { + model: "claude-3-haiku-20240307", + messages: [{ role: "user", content: "Count from 1 to 10." 
}], + stop: ["5", "END"], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyOpenAIStopSequences: { + format: "chat-completions", + request: { + model: "gpt-4o-mini", + messages: [{ role: "user", content: "Count from 1 to 10." }], + stop: ["5", "END"], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyGoogleJsonObjectFormat: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: "Return a JSON object with a greeting field set to hello.", + }, + ], + response_format: { type: "json_object" }, + max_tokens: 100, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + proxyGoogleJsonSchemaFormat: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [ + { + role: "user", + content: "What is 10 + 5? Answer with just the number.", + }, + ], + response_format: { + type: "json_schema", + json_schema: { + name: "math_result", + schema: { + type: "object", + properties: { result: { type: "number" } }, + required: ["result"], + }, + }, + }, + max_tokens: 50, + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + }, + }, + }, + + proxyGoogleUnsupportedParamsFilter: { + format: "chat-completions", + request: { + model: "gemini-2.0-flash", + messages: [{ role: "user", content: "Say hello." }], + frequency_penalty: 0.5, + presence_penalty: 0.5, + max_tokens: 50, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyOpenAIPdfUrlConversion: { + format: "chat-completions", + request: { + model: "gpt-4o", + messages: [ + { + role: "user", + content: [ + { type: "text", text: "What type of document is this?" }, + { + type: "image_url", + image_url: { + url: "https://www.w3.org/WAI/WCAG21/Techniques/pdf/img/table-word.pdf", + }, + }, + ], + }, + ], + max_tokens: 100, + }, + expect: { status: 200, fields: { "choices[0].message.role": "assistant" } }, + }, + + proxyAnthropic128kBetaHeader: { + format: "chat-completions", + request: { + model: "claude-3-7-sonnet-latest", + messages: [ + { + role: "user", + content: "Write a very short poem (2 lines) about coding.", + }, + ], + }, + expect: { + status: 200, + fields: { + "choices[0].message.role": "assistant", + "choices[0].finish_reason": "stop", + object: "chat.completion", + }, + }, + }, + + proxyOpenAIO3MiniStreamingReasoning: { + format: "chat-completions", + request: { + model: "o3-mini-2025-01-31", + messages: [{ role: "user", content: "What is 7 * 8?" 
}], + reasoning_effort: "medium", + stream: true, + max_tokens: 1000, + }, + expect: { status: 200 }, + }, +}; diff --git a/payloads/proxy/index.ts b/payloads/proxy/index.ts new file mode 100644 index 00000000..3255a5bc --- /dev/null +++ b/payloads/proxy/index.ts @@ -0,0 +1,8 @@ +export * from "./types"; +export { proxyCases } from "./cases"; + +import { proxyCases } from "./cases"; + +export function getProxyCaseNames(): string[] { + return Object.keys(proxyCases); +} diff --git a/payloads/proxy/types.ts b/payloads/proxy/types.ts new file mode 100644 index 00000000..edf626ab --- /dev/null +++ b/payloads/proxy/types.ts @@ -0,0 +1,24 @@ +import OpenAI from "openai"; + +export interface ProxyTestExpectation { + status?: number; + fields?: Record; + error?: { + type?: string; + message?: string; + }; +} + +export type ProxyTestCase = + | { + format: "chat-completions"; + request: OpenAI.Chat.Completions.ChatCompletionCreateParams; + expect: ProxyTestExpectation; + } + | { + format: "responses"; + request: OpenAI.Responses.ResponseCreateParams; + expect: ProxyTestExpectation; + }; + +export type ProxyTestCaseCollection = Record; diff --git a/payloads/scripts/validation/index.ts b/payloads/scripts/validation/index.ts index 41e8a5a8..91b569ff 100644 --- a/payloads/scripts/validation/index.ts +++ b/payloads/scripts/validation/index.ts @@ -1,22 +1,14 @@ -// Core validation library - runValidation() - import { readFileSync, existsSync } from "fs"; import { join } from "path"; import { compareResponses, DiffResult, hasOnlyMinorDiffs } from "./diff-utils"; - -// Import executors import { openaiExecutor } from "../providers/openai"; import { openaiResponsesExecutor } from "../providers/openai-responses"; import { anthropicExecutor } from "../providers/anthropic"; - -// Import test cases from code import { allTestCases, getCaseNames, getCaseForProvider, - getFullTestCase, caseCollections, - TestExpectation, } from "../../cases"; import { OPENAI_CHAT_COMPLETIONS_MODEL, @@ -24,8 +16,13 @@ import { GOOGLE_MODEL, BEDROCK_MODEL, } from "../../cases/models"; +import { + proxyCases, + getProxyCaseNames, + ProxyTestExpectation, +} from "../../proxy"; -// Simplified executor interface for the registry (relaxes generic constraints) +// Relaxes generic constraints for heterogeneous executor types interface ExecutorEntry { name: string; cases: Record; @@ -42,15 +39,12 @@ interface ExecutorEntry { ignoredFields?: string[]; } -// Format registry - maps format names to executors -// Type assertions are necessary for heterogeneous executor types in the registry -/* eslint-disable @typescript-eslint/consistent-type-assertions */ +/* eslint-disable @typescript-eslint/consistent-type-assertions -- heterogeneous executor types */ const formatRegistry: Record = { "chat-completions": openaiExecutor as ExecutorEntry, responses: openaiResponsesExecutor as ExecutorEntry, anthropic: anthropicExecutor as ExecutorEntry, }; -/* eslint-enable @typescript-eslint/consistent-type-assertions */ /** * Type guard to check if value is a record with string keys. @@ -81,7 +75,7 @@ function getPath(obj: unknown, path: string): unknown { * Returns null if all expectations pass, or an error message if any fail. 
*/ function validateExpectations( - expect: TestExpectation, + expect: ProxyTestExpectation, response: unknown, httpStatus?: number ): string | null { @@ -207,6 +201,26 @@ function loadSnapshotFile( // Default cases to run (fast + representative) const DEFAULT_CASES = ["simpleRequest", "toolCallRequest", "reasoningRequest"]; +// Batch size for parallel promise execution +const BATCH_SIZE = 10; + +/** + * Process an array in batches, running each batch in parallel. + */ +async function processBatches( + items: T[], + batchSize: number, + processor: (item: T) => Promise +): Promise { + const results: R[] = []; + for (let i = 0; i < items.length; i += batchSize) { + const batch = items.slice(i, i + batchSize); + const batchResults = await Promise.all(batch.map(processor)); + results.push(...batchResults); + } + return results; +} + // Provider registry - maps provider aliases to actual model names (uses canonical models.ts) const PROVIDER_REGISTRY: Record = { openai: OPENAI_CHAT_COMPLETIONS_MODEL, @@ -277,13 +291,26 @@ export async function runValidation( continue; } - // Get cases to run - const availableCases = getAvailableCases(format); + // Get cases to run (snapshot cases + proxy cases) + const availableSnapshotCases = getAvailableCases(format); + const availableProxyCases = getProxyCaseNames().filter((name) => { + const proxyCase = proxyCases[name]; + return proxyCase && proxyCase.format === format; + }); + const availableCases = [ + ...availableSnapshotCases, + ...availableProxyCases.filter((c) => !availableSnapshotCases.includes(c)), + ]; + let caseNames: string[]; if (options.cases) { // User specified explicit cases or collection names - expand collections + const allCollections: Record = { + ...caseCollections, + proxy: getProxyCaseNames(), + }; const expandedCases = options.cases.flatMap( - (c) => caseCollections[c] ?? [c] + (c) => allCollections[c] ?? [c] ); caseNames = expandedCases.filter((c) => availableCases.includes(c)); } else if (options.all) { @@ -308,205 +335,206 @@ export async function runValidation( } } - const caseResults = await Promise.all( - testCombinations.map( - async ({ caseName, providerAlias }): Promise => { - const start = Date.now(); - - // Resolve model name from provider alias - const modelName = - providerAlias === "default" - ? "default" - : (PROVIDER_REGISTRY[providerAlias] ?? providerAlias); - - try { - // Get request from cases definitions (single source of truth) - const caseRequest = getCaseForProvider( - allTestCases, - caseName, - // eslint-disable-next-line @typescript-eslint/consistent-type-assertions -- format is a string key - format as - | "chat-completions" - | "responses" - | "anthropic" - | "google" - | "bedrock" - ); - // eslint-disable-next-line @typescript-eslint/consistent-type-assertions -- Need to type the request for model override - let request = caseRequest as Record | null; - // Load expected response from snapshots for comparison - const snapshotFilename = options.stream - ? 
"response-streaming.json" - : "response.json"; - const expectedResponse = loadSnapshotFile( - caseName, - format, - snapshotFilename - ); - - if (!request) { - const result: ValidationResult = { - format, - caseName, - model: modelName, - success: false, - durationMs: Date.now() - start, - error: `Case ${caseName} not found for format ${format}`, - }; - options.onResult?.(result); - return result; - } - - // Check if this is an expectation-based test - const fullTestCase = getFullTestCase(allTestCases, caseName); - const expectations = fullTestCase?.expect; - - // For expectation-based tests, use direct HTTP request to get status codes - if (expectations) { - const endpoint = - format === "chat-completions" - ? "/v1/chat/completions" - : "/v1/responses"; - const fetchResponse = await fetch( - `${options.proxyUrl}${endpoint}`, - { - method: "POST", - headers: { - "Content-Type": "application/json", - ...(options.apiKey - ? { Authorization: `Bearer ${options.apiKey}` } - : {}), - }, - body: JSON.stringify(request), - } - ); - - const httpStatus = fetchResponse.status; - let responseBody: unknown; - try { - responseBody = await fetchResponse.json(); - } catch { - responseBody = { error: "Failed to parse response JSON" }; - } - - const validationError = validateExpectations( - expectations, - responseBody, - httpStatus - ); - - const result: ValidationResult = { - format, - caseName, - model: modelName, - success: validationError === null, - durationMs: Date.now() - start, - error: validationError ?? undefined, - actualResponse: options.verbose ? responseBody : undefined, - }; - options.onResult?.(result); - return result; - } - - // Standard snapshot-based validation - if (!expectedResponse) { - const result: ValidationResult = { - format, - caseName, - model: modelName, - success: false, - durationMs: Date.now() - start, - error: `Missing ${snapshotFilename} for ${caseName}/${format}`, - }; - options.onResult?.(result); - return result; - } - - // Override model only for cross-provider testing - // OpenAI formats (chat-completions, responses) with non-OpenAI providers - if ( - providerAlias !== "default" && - providerAlias !== "openai" && // Don't override for OpenAI - tests have correct models - PROVIDER_REGISTRY[providerAlias] - ) { - const isOpenAIFormat = - format === "chat-completions" || format === "responses"; - if (isOpenAIFormat) { - // Override for cross-provider translation testing - request = { - ...request, - model: PROVIDER_REGISTRY[providerAlias], - }; + const caseResults = await processBatches( + testCombinations, + BATCH_SIZE, + async ({ caseName, providerAlias }): Promise => { + const start = Date.now(); + + // Resolve model name from provider alias + const modelName = + providerAlias === "default" + ? "default" + : (PROVIDER_REGISTRY[providerAlias] ?? providerAlias); + + try { + // Check if this is a proxy test case first (expectation-based validation) + const proxyCase = proxyCases[caseName]; + const isProxyCase = proxyCase && proxyCase.format === format; + + // For proxy test cases, use direct HTTP validation with expectations + if (isProxyCase) { + const expectations = proxyCase.expect; + const endpoint = + format === "chat-completions" + ? "/v1/chat/completions" + : "/v1/responses"; + const fetchResponse = await fetch( + `${options.proxyUrl}${endpoint}`, + { + method: "POST", + headers: { + "Content-Type": "application/json", + ...(options.apiKey + ? 
{ Authorization: `Bearer ${options.apiKey}` } + : {}), + }, + body: JSON.stringify(proxyCase.request), } - } + ); - // Execute through proxy - const actual = await executor.execute(caseName, request, { - stream: options.stream, - baseURL: options.proxyUrl, - apiKey: options.apiKey, - }); - - if (actual.error) { - const result: ValidationResult = { - format, - caseName, - model: modelName, - success: false, - durationMs: Date.now() - start, - error: actual.error, - }; - options.onResult?.(result); - return result; + const httpStatus = fetchResponse.status; + let responseBody: unknown; + try { + responseBody = await fetchResponse.json(); + } catch { + responseBody = { error: "Failed to parse response JSON" }; } - // Compare response (use streamingResponse array when streaming) - const actualResponse = options.stream - ? actual.streamingResponse - : actual.response; + const validationError = validateExpectations( + expectations, + responseBody, + httpStatus + ); - // Extract actual model from response (fallback to registry-based name) - const actualModel = - extractModelFromResponse(actualResponse, options.stream) ?? - modelName; + const result: ValidationResult = { + format, + caseName, + model: modelName, + success: validationError === null, + durationMs: Date.now() - start, + error: validationError ?? undefined, + actualResponse: options.verbose ? responseBody : undefined, + }; + options.onResult?.(result); + return result; + } - const diff = compareResponses( - expectedResponse, - actualResponse, - executor.ignoredFields ?? [] - ); + // Standard snapshot-based validation - get request from cases definitions + const caseRequest = getCaseForProvider( + allTestCases, + caseName, + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions -- format is a string key + format as + | "chat-completions" + | "responses" + | "anthropic" + | "google" + | "bedrock" + ); + // eslint-disable-next-line @typescript-eslint/consistent-type-assertions -- Need to type the request for model override + let request = caseRequest as Record | null; + + if (!request) { + const result: ValidationResult = { + format, + caseName, + model: modelName, + success: false, + durationMs: Date.now() - start, + error: `Case ${caseName} not found for format ${format}`, + }; + options.onResult?.(result); + return result; + } - // Determine success/warning state: - // - success=true, warning=undefined: perfect match (no diffs) - // - success=true, warning=true: only minor diffs (logprobs, tool args) - // - success=false: major diffs or errors - const onlyMinorDiffs = hasOnlyMinorDiffs(diff); + // Load expected response from snapshots for comparison + const snapshotFilename = options.stream + ? "response-streaming.json" + : "response.json"; + const expectedResponse = loadSnapshotFile( + caseName, + format, + snapshotFilename + ); + + if (!expectedResponse) { const result: ValidationResult = { format, caseName, - model: actualModel, - success: diff.match || onlyMinorDiffs, - warning: onlyMinorDiffs ? true : undefined, + model: modelName, + success: false, durationMs: Date.now() - start, - diff: diff.match ? undefined : diff, // Include diff for warnings too - actualResponse: options.verbose ? 
actualResponse : undefined, + error: `Missing ${snapshotFilename} for ${caseName}/${format}`, }; options.onResult?.(result); return result; - } catch (error) { + } + + // Override model only for cross-provider testing + // OpenAI formats (chat-completions, responses) with non-OpenAI providers + if ( + providerAlias !== "default" && + providerAlias !== "openai" && // Don't override for OpenAI - tests have correct models + PROVIDER_REGISTRY[providerAlias] + ) { + const isOpenAIFormat = + format === "chat-completions" || format === "responses"; + if (isOpenAIFormat) { + // Override for cross-provider translation testing + request = { + ...request, + model: PROVIDER_REGISTRY[providerAlias], + }; + } + } + + // Execute through proxy + const actual = await executor.execute(caseName, request, { + stream: options.stream, + baseURL: options.proxyUrl, + apiKey: options.apiKey, + }); + + if (actual.error) { const result: ValidationResult = { format, caseName, model: modelName, success: false, durationMs: Date.now() - start, - error: String(error), + error: actual.error, }; options.onResult?.(result); return result; } + + // Compare response (use streamingResponse array when streaming) + const actualResponse = options.stream + ? actual.streamingResponse + : actual.response; + + // Extract actual model from response (fallback to registry-based name) + const actualModel = + extractModelFromResponse(actualResponse, options.stream) ?? + modelName; + + const diff = compareResponses( + expectedResponse, + actualResponse, + executor.ignoredFields ?? [] + ); + + // Determine success/warning state: + // - success=true, warning=undefined: perfect match (no diffs) + // - success=true, warning=true: only minor diffs (logprobs, tool args) + // - success=false: major diffs or errors + const onlyMinorDiffs = hasOnlyMinorDiffs(diff); + const result: ValidationResult = { + format, + caseName, + model: actualModel, + success: diff.match || onlyMinorDiffs, + warning: onlyMinorDiffs ? true : undefined, + durationMs: Date.now() - start, + diff: diff.match ? undefined : diff, // Include diff for warnings too + actualResponse: options.verbose ? 
actualResponse : undefined, + }; + options.onResult?.(result); + return result; + } catch (error) { + const result: ValidationResult = { + format, + caseName, + model: modelName, + success: false, + durationMs: Date.now() - start, + error: String(error), + }; + options.onResult?.(result); + return result; } - ) + } ); results.push(...caseResults); From 520fa1f1f351a53a288a0b6ee2d73c82168a26ac Mon Sep 17 00:00:00 2001 From: Ken Jiang Date: Sat, 31 Jan 2026 12:26:07 -0500 Subject: [PATCH 5/5] update reasoning with canonical source and fix convert.rs for responses --- .../src/requests_expected_differences.json | 11 +- .../src/responses_expected_differences.json | 49 ++ crates/coverage-report/src/runner.rs | 259 ++++---- .../src/streaming_expected_differences.json | 15 + .../lingua/src/providers/anthropic/adapter.rs | 32 +- .../lingua/src/providers/bedrock/adapter.rs | 27 +- crates/lingua/src/providers/google/adapter.rs | 8 +- crates/lingua/src/providers/openai/adapter.rs | 49 +- crates/lingua/src/providers/openai/convert.rs | 594 +++++++++++++++++- .../src/providers/openai/responses_adapter.rs | 135 ++-- crates/lingua/src/universal/mod.rs | 6 +- crates/lingua/src/universal/reasoning.rs | 123 ++-- crates/lingua/src/universal/request.rs | 43 +- crates/lingua/src/universal/tools.rs | 13 +- 14 files changed, 1007 insertions(+), 357 deletions(-) diff --git a/crates/coverage-report/src/requests_expected_differences.json b/crates/coverage-report/src/requests_expected_differences.json index 2879210b..b45c30fb 100644 --- a/crates/coverage-report/src/requests_expected_differences.json +++ b/crates/coverage-report/src/requests_expected_differences.json @@ -5,7 +5,8 @@ "target": "*", "fields": [ { "pattern": "params.service_tier", "reason": "OpenAI-specific billing tier not universal across providers" }, - { "pattern": "messages[*].id", "reason": "Message/response IDs are provider-specific (OpenAI uses response-level IDs, Anthropic uses message-level IDs, Bedrock has none)" } + { "pattern": "messages[*].id", "reason": "Message/response IDs are provider-specific (OpenAI uses response-level IDs, Anthropic uses message-level IDs, Bedrock has none)" }, + { "pattern": "params.reasoning.canonical", "reason": "Metadata indicating source format (effort vs budget_tokens) - changes when converting between providers with different canonical representations" } ] }, { @@ -95,7 +96,9 @@ "fields": [ { "pattern": "params.temperature", "reason": "Bedrock requires temperature=1.0 for extended thinking" }, { "pattern": "params.stream", "reason": "Bedrock uses endpoint-based streaming" }, - { "pattern": "params.metadata", "reason": "Bedrock doesn't support metadata" } + { "pattern": "params.metadata", "reason": "Bedrock doesn't support metadata" }, + { "pattern": "params.reasoning.effort", "reason": "Cross-canonical conversion (effort→budget_tokens) may quantize when max_tokens is very small" }, + { "pattern": "params.reasoning.summary", "reason": "Bedrock doesn't support reasoning summary" } ] }, { @@ -103,7 +106,9 @@ "target": "Google", "fields": [ { "pattern": "params.stream", "reason": "Google uses endpoint-based streaming" }, - { "pattern": "params.metadata", "reason": "Google doesn't support metadata" } + { "pattern": "params.metadata", "reason": "Google doesn't support metadata" }, + { "pattern": "params.reasoning.effort", "reason": "Cross-canonical conversion (effort→budget_tokens) may quantize when max_tokens is very small" }, + { "pattern": "params.reasoning.summary", "reason": "Google doesn't support reasoning 
summary" } ] } ], diff --git a/crates/coverage-report/src/responses_expected_differences.json b/crates/coverage-report/src/responses_expected_differences.json index a8ac797f..8471714c 100644 --- a/crates/coverage-report/src/responses_expected_differences.json +++ b/crates/coverage-report/src/responses_expected_differences.json @@ -21,6 +21,31 @@ "fields": [ { "pattern": "usage.completion_reasoning_tokens", "reason": "Anthropic doesn't expose reasoning tokens separately (included in output_tokens)" } ] + }, + { + "source": "Responses", + "target": "Anthropic", + "fields": [ + { "pattern": "messages[*].content[*].provider_options", "reason": "Responses API annotations/logprobs have no Anthropic equivalent" }, + { "pattern": "messages.length", "reason": "Responses API OutputItems map to separate Messages; Anthropic consolidates into one" } + ] + }, + { + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "messages.length", "reason": "Anthropic single message expands to multiple OutputItems in Responses API" } + ] + }, + { + "source": "Responses", + "target": "ChatCompletions", + "fields": [ + { "pattern": "messages[*].content[*].provider_options", "reason": "Responses API annotations/logprobs have no ChatCompletions equivalent" }, + { "pattern": "messages[*].content[*].provider_executed", "reason": "Responses API provider_executed flag has no ChatCompletions equivalent" }, + { "pattern": "messages.length", "reason": "Responses API OutputItems map to separate Messages; ChatCompletions consolidates into one" }, + { "pattern": "messages[*].content.length", "reason": "Responses API reasoning content parts have no ChatCompletions equivalent" } + ] } ], "perTestCase": [ @@ -103,6 +128,30 @@ "fields": [ { "pattern": "messages[0].content.length", "reason": "Anthropic web search content blocks don't map 1:1 to ChatCompletions structure" } ] + }, + { + "testCase": "webSearchToolParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "finish_reason", "reason": "Anthropic web search tool responses have different finish_reason mapping" } + ] + }, + { + "testCase": "webSearchToolAdvancedParam", + "source": "Anthropic", + "target": "Responses", + "fields": [ + { "pattern": "finish_reason", "reason": "Anthropic web search tool responses have different finish_reason mapping" } + ] + }, + { + "testCase": "nMultipleCompletionsParam", + "source": "ChatCompletions", + "target": "Responses", + "fields": [ + { "pattern": "messages.length", "reason": "Responses API doesn't support n>1 (multiple completions)" } + ] } ] } diff --git a/crates/coverage-report/src/runner.rs b/crates/coverage-report/src/runner.rs index 3b29a044..ed6311ad 100644 --- a/crates/coverage-report/src/runner.rs +++ b/crates/coverage-report/src/runner.rs @@ -4,12 +4,8 @@ Test execution for coverage-report. 
use std::collections::HashMap; -use bytes::Bytes; use lingua::capabilities::ProviderFormat; use lingua::processing::adapters::ProviderAdapter; -use lingua::processing::transform::{ - transform_request, transform_response, transform_stream_chunk, -}; use lingua::serde_json::Value; use lingua::universal::{UniversalRequest, UniversalResponse, UniversalStreamChunk}; @@ -117,56 +113,16 @@ pub fn test_request_transformation( target_adapter.apply_defaults(&mut expected_universal); let expected_universal_value = universal_request_to_value(&expected_universal); - match transform_request(payload, target_adapter.format(), model) { - Ok(result) => { - // Parse result bytes to Value for validation - let output_bytes = result.into_bytes(); - let transformed: Value = match lingua::serde_json::from_slice(&output_bytes) { - Ok(v) => v, - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Failed to parse transformed output: {}", e)), - diff: None, - limitation_reason: None, - } - } - }; - - // Use request_to_universal to validate - gives detailed error info - match target_adapter.request_to_universal(transformed) { - Ok(target_universal) => { - let target_universal_value = universal_request_to_value(&target_universal); - let context = CompareContext::for_cross_provider( - TestCategory::Requests, - source_adapter, - target_adapter, - test_case, - ); - let roundtrip_result = compare_values( - &expected_universal_value, - &target_universal_value, - context.as_ref(), - ); - diff_to_transform_result(roundtrip_result) - } - Err(e) => TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Conversion from universal format failed: {}", e)), - diff: None, - limitation_reason: None, - }, - } - } + let provider_value = match target_adapter.request_from_universal(&expected_universal) { + Ok(v) => v, Err(e) => { - let error_msg = e.to_string(); + let error_msg = format!("Conversion from universal failed: {}", e); let context = CompareContext::for_cross_provider( TestCategory::Requests, source_adapter, target_adapter, test_case, ); - // For roundtrip tests (context=None), all errors are real failures let reason = context.as_ref().and_then(|ctx| { ctx.is_test_case_limitation().or_else(|| { is_expected_error( @@ -185,13 +141,50 @@ pub fn test_request_transformation( ValidationLevel::Fail }; - TransformResult { + return TransformResult { level, error: Some(error_msg), diff: None, limitation_reason: reason.map(|r| r.to_string()), - } + }; } + }; + + let transformed: Value = match lingua::serde_json::to_value(&provider_value) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Failed to serialize provider value: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + // Use request_to_universal to validate - gives detailed error info + match target_adapter.request_to_universal(transformed) { + Ok(target_universal) => { + let target_universal_value = universal_request_to_value(&target_universal); + let context = CompareContext::for_cross_provider( + TestCategory::Requests, + source_adapter, + target_adapter, + test_case, + ); + let roundtrip_result = compare_values( + &expected_universal_value, + &target_universal_value, + context.as_ref(), + ); + diff_to_transform_result(roundtrip_result) + } + Err(e) => TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, + }, } } @@ -239,56 +232,16 
@@ pub fn test_response_transformation( let expected_universal_value = universal_response_to_value(&expected_universal); - match transform_response(payload, target_adapter.format()) { - Ok(result) => { - // Parse result bytes to Value for validation - let output_bytes = result.into_bytes(); - let transformed: Value = match lingua::serde_json::from_slice(&output_bytes) { - Ok(v) => v, - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Failed to parse transformed output: {}", e)), - diff: None, - limitation_reason: None, - } - } - }; - - // Use response_to_universal to validate - gives detailed error info - match target_adapter.response_to_universal(transformed) { - Ok(target_universal) => { - let target_universal_value = universal_response_to_value(&target_universal); - let context = CompareContext::for_cross_provider( - TestCategory::Responses, - source_adapter, - target_adapter, - test_case, - ); - let roundtrip_result = compare_values( - &expected_universal_value, - &target_universal_value, - context.as_ref(), - ); - diff_to_transform_result(roundtrip_result) - } - Err(e) => TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Conversion from universal format failed: {}", e)), - diff: None, - limitation_reason: None, - }, - } - } + let provider_value = match target_adapter.response_from_universal(&expected_universal) { + Ok(v) => v, Err(e) => { - let error_msg = e.to_string(); + let error_msg = format!("Conversion from universal failed: {}", e); let context = CompareContext::for_cross_provider( TestCategory::Responses, source_adapter, target_adapter, test_case, ); - // For roundtrip tests (context=None), all errors are real failures let reason = context.as_ref().and_then(|ctx| { ctx.is_test_case_limitation().or_else(|| { is_expected_error( @@ -307,13 +260,49 @@ pub fn test_response_transformation( ValidationLevel::Fail }; - TransformResult { + return TransformResult { level, error: Some(error_msg), diff: None, limitation_reason: reason.map(|r| r.to_string()), - } + }; + } + }; + + let transformed: Value = match lingua::serde_json::to_value(&provider_value) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Failed to serialize provider value: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; + + match target_adapter.response_to_universal(transformed) { + Ok(target_universal) => { + let target_universal_value = universal_response_to_value(&target_universal); + let context = CompareContext::for_cross_provider( + TestCategory::Responses, + source_adapter, + target_adapter, + test_case, + ); + let roundtrip_result = compare_values( + &expected_universal_value, + &target_universal_value, + context.as_ref(), + ); + diff_to_transform_result(roundtrip_result) } + Err(e) => TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, + }, } } @@ -406,56 +395,48 @@ fn test_single_stream_event( } }; - // Serialize each event back to bytes for the transform function - let event_bytes = match lingua::serde_json::to_vec(event) { - Ok(b) => Bytes::from(b), - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("failed to serialize: {}", e)), - diff: None, - limitation_reason: None, + let target_universal = match &source_universal { + Some(chunk) => { + let provider_value = match target_adapter.stream_from_universal(chunk) { 
+ Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion from universal failed: {}", e)), + diff: None, + limitation_reason: None, + }; + } }; - } - }; - // Transform the event to target format - let result = match transform_stream_chunk(event_bytes, target_adapter.format()) { - Ok(r) => r, - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(e.to_string()), - diff: None, - limitation_reason: None, - } - } - }; + let transformed: Value = match lingua::serde_json::to_value(&provider_value) { + Ok(v) => v, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Failed to serialize provider value: {}", e)), + diff: None, + limitation_reason: None, + }; + } + }; - // Parse result bytes to Value for validation - let output_bytes = result.into_bytes(); - let transformed: Value = match lingua::serde_json::from_slice(&output_bytes) { - Ok(v) => v, - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(e.to_string()), - diff: None, - limitation_reason: None, + // Convert back to universal for comparison + match target_adapter.stream_to_universal(transformed) { + Ok(u) => u, + Err(e) => { + return TransformResult { + level: ValidationLevel::Fail, + error: Some(format!("Conversion from universal format failed: {}", e)), + diff: None, + limitation_reason: None, + }; + } } } - }; - - // Validate transformed output can be parsed by target adapter - let target_universal = match target_adapter.stream_to_universal(transformed) { - Ok(u) => u, - Err(e) => { - return TransformResult { - level: ValidationLevel::Fail, - error: Some(format!("Conversion from universal format failed: {}", e)), - diff: None, - limitation_reason: None, - } + None => { + // Keep-alive event with no universal representation - pass through + None } }; diff --git a/crates/coverage-report/src/streaming_expected_differences.json b/crates/coverage-report/src/streaming_expected_differences.json index 897a4f09..0a8ba157 100644 --- a/crates/coverage-report/src/streaming_expected_differences.json +++ b/crates/coverage-report/src/streaming_expected_differences.json @@ -39,6 +39,21 @@ "fields": [ { "pattern": "model", "reason": "Bedrock streaming format doesn't include model in events" } ] + }, + { + "source": "*", + "target": "Anthropic", + "fields": [ + { "pattern": "usage.completion_reasoning_tokens", "reason": "Anthropic doesn't expose reasoning tokens separately (included in output_tokens)" } + ] + }, + { + "source": "Responses", + "target": "Anthropic", + "fields": [ + { "pattern": "id", "reason": "Responses API response IDs don't map to Anthropic streaming format" }, + { "pattern": "model", "reason": "Responses API model field isn't preserved in Anthropic streaming events" } + ] } ], "perTestCase": [ diff --git a/crates/lingua/src/providers/anthropic/adapter.rs b/crates/lingua/src/providers/anthropic/adapter.rs index 66d9b233..04e7e3f6 100644 --- a/crates/lingua/src/providers/anthropic/adapter.rs +++ b/crates/lingua/src/providers/anthropic/adapter.rs @@ -18,7 +18,6 @@ use crate::providers::anthropic::try_parse_anthropic; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::{Message, UserContent}; -use crate::universal::reasoning::ANTHROPIC_THINKING_TEMPERATURE; use crate::universal::tools::{tools_to_anthropic_value, UniversalTool}; use crate::universal::transform::extract_system_messages; use 
crate::universal::{ @@ -162,24 +161,18 @@ impl ProviderAdapter for AnthropicAdapter { let max_tokens = req.params.max_tokens.unwrap_or(DEFAULT_MAX_TOKENS); obj.insert("max_tokens".into(), Value::Number(max_tokens.into())); - // Check if reasoning/thinking is enabled (needed for temperature override) + // Check if reasoning/thinking is enabled // Note: thinking_val can be { type: "disabled" } or { type: "enabled", ... } - // Only override temperature when type is "enabled" let thinking_val = req.params.reasoning_for(ProviderFormat::Anthropic); let reasoning_enabled = thinking_val .as_ref() .and_then(|v| v.get("type")) .and_then(|t| t.as_str()) .is_some_and(|t| t == "enabled"); + if !reasoning_enabled { + insert_opt_f64(&mut obj, "temperature", req.params.temperature); + } - // Insert other params - // Anthropic requires temperature=1.0 when extended thinking is enabled - let temperature = if reasoning_enabled { - Some(ANTHROPIC_THINKING_TEMPERATURE) - } else { - req.params.temperature - }; - insert_opt_f64(&mut obj, "temperature", temperature); insert_opt_f64(&mut obj, "top_p", req.params.top_p); insert_opt_i64(&mut obj, "top_k", req.params.top_k); @@ -687,7 +680,7 @@ mod tests { } #[test] - fn test_anthropic_auto_corrects_temperature_with_thinking() { + fn test_anthropic_omits_temperature_with_thinking() { use crate::universal::message::UserContent; use crate::universal::request::ReasoningConfig; @@ -700,7 +693,7 @@ mod tests { content: UserContent::String("Hello".to_string()), }], params: UniversalParams { - temperature: Some(0.5), // User specified, but should be overridden + temperature: Some(0.5), // User specified, but should be omitted reasoning: Some(ReasoningConfig { enabled: Some(true), budget_tokens: Some(2048), @@ -713,14 +706,10 @@ mod tests { let result = adapter.request_from_universal(&req).unwrap(); - // Temperature should be auto-corrected to 1.0 (ANTHROPIC_THINKING_TEMPERATURE) - assert_eq!( - result.get("temperature").unwrap().as_f64().unwrap(), - 1.0, - "Temperature should be auto-corrected to 1.0 when thinking is enabled" + assert!( + result.get("temperature").is_none(), + "Temperature should be omitted when thinking is enabled" ); - - // Thinking should be present assert!( result.get("thinking").is_some(), "thinking field should be present" @@ -748,14 +737,11 @@ mod tests { let result = adapter.request_from_universal(&req).unwrap(); - // Temperature should be preserved as user specified assert_eq!( result.get("temperature").unwrap().as_f64().unwrap(), 0.7, "Temperature should be preserved when thinking is not enabled" ); - - // No thinking field assert!( result.get("thinking").is_none(), "thinking field should not be present" diff --git a/crates/lingua/src/providers/bedrock/adapter.rs b/crates/lingua/src/providers/bedrock/adapter.rs index a1abafe6..e8a56d5e 100644 --- a/crates/lingua/src/providers/bedrock/adapter.rs +++ b/crates/lingua/src/providers/bedrock/adapter.rs @@ -19,7 +19,6 @@ use crate::providers::bedrock::try_parse_bedrock; use crate::serde_json::{self, Map, Value}; use crate::universal::convert::TryFromLLM; use crate::universal::message::Message; -use crate::universal::reasoning::ANTHROPIC_THINKING_TEMPERATURE; use crate::universal::request::ReasoningConfig; use crate::universal::tools::{UniversalTool, UniversalToolType}; use crate::universal::{ @@ -178,20 +177,16 @@ impl ProviderAdapter for BedrockAdapter { .map_err(|e| TransformError::SerializationFailed(e.to_string()))?, ); - // Check if reasoning/thinking is enabled (for temperature override) + // Check 
if reasoning/thinking is enabled // Note: thinking_config can be { type: "disabled" } or { type: "enabled", ... } - // Only override temperature when type is "enabled" let thinking_config = req.params.reasoning_for(ProviderFormat::Converse); let reasoning_enabled = thinking_config .as_ref() .and_then(|v| v.get("type")) .and_then(|t| t.as_str()) .is_some_and(|t| t == "enabled"); - - // Build inferenceConfig if any params are set - // Note: Claude on Bedrock requires temperature=1.0 when extended thinking is enabled let temperature = if reasoning_enabled { - Some(ANTHROPIC_THINKING_TEMPERATURE) + None } else { req.params.temperature }; @@ -684,7 +679,7 @@ mod tests { } #[test] - fn test_bedrock_reasoning_sets_temperature_to_1() { + fn test_bedrock_reasoning_omits_temperature() { use crate::universal::request::ReasoningConfig; let adapter = BedrockAdapter; @@ -699,7 +694,7 @@ mod tests { budget_tokens: Some(2048), ..Default::default() }), - temperature: Some(0.5), // This should be overridden to 1.0 + temperature: Some(0.5), // This should be omitted when thinking is enabled max_tokens: Some(4096), ..Default::default() }, @@ -707,9 +702,12 @@ mod tests { let reconstructed = adapter.request_from_universal(&universal).unwrap(); - // Temperature should be 1.0 when thinking is enabled + // Temperature should be omitted when thinking is enabled (let Bedrock default to 1.0) let inference_config = reconstructed.get("inferenceConfig").unwrap(); - assert_eq!(inference_config.get("temperature").unwrap(), 1.0); + assert!( + inference_config.get("temperature").is_none(), + "Temperature should be omitted when thinking is enabled" + ); } #[test] @@ -752,8 +750,11 @@ mod tests { assert_eq!(thinking.get("type").unwrap(), "enabled"); assert_eq!(thinking.get("budget_tokens").unwrap(), 2500); - // Verify temperature is set to 1.0 + // Temperature should be omitted when thinking is enabled let inference_config = reconstructed.get("inferenceConfig").unwrap(); - assert_eq!(inference_config.get("temperature").unwrap(), 1.0); + assert!( + inference_config.get("temperature").is_none(), + "Temperature should be omitted when thinking is enabled" + ); } } diff --git a/crates/lingua/src/providers/google/adapter.rs b/crates/lingua/src/providers/google/adapter.rs index 34532470..d7b67e34 100644 --- a/crates/lingua/src/providers/google/adapter.rs +++ b/crates/lingua/src/providers/google/adapter.rs @@ -70,9 +70,15 @@ impl ProviderAdapter for GoogleAdapter { // thinkingBudget: 0 means disabled let reasoning = config.thinking_config.as_ref().map(|tc| { let is_disabled = tc.thinking_budget == Some(0); + let budget_tokens = tc.thinking_budget.map(|b| b as i64); + // Derive effort from budget_tokens + let effort = budget_tokens + .map(|b| crate::universal::reasoning::budget_to_effort(b, None)); crate::universal::ReasoningConfig { enabled: Some(!is_disabled), - budget_tokens: tc.thinking_budget.map(|b| b as i64), + effort, + budget_tokens, + canonical: Some(crate::universal::ReasoningCanonical::BudgetTokens), ..Default::default() } }); diff --git a/crates/lingua/src/providers/openai/adapter.rs b/crates/lingua/src/providers/openai/adapter.rs index ce2acb9b..b77a3d33 100644 --- a/crates/lingua/src/providers/openai/adapter.rs +++ b/crates/lingua/src/providers/openai/adapter.rs @@ -535,38 +535,59 @@ fn build_reasoning_config( reasoning_effort: Option, max_tokens: Option, ) -> Option { - // Check if any reasoning field is set + use crate::universal::reasoning::budget_to_effort; + use crate::universal::ReasoningCanonical; + if 
reasoning_enabled.is_none() && reasoning_budget.is_none() && reasoning_effort.is_none() { return None; } - // Determine if reasoning is disabled - // reasoning_enabled: false OR reasoning_budget: 0 means disabled let is_disabled = reasoning_enabled == Some(false) || reasoning_budget == Some(0); if is_disabled { return Some(ReasoningConfig { enabled: Some(false), + effort: None, budget_tokens: None, + canonical: None, ..Default::default() }); } - // Calculate budget_tokens: reasoning_budget takes precedence over reasoning_effort - let budget_tokens = reasoning_budget.or_else(|| { - reasoning_effort.map(|effort| { - let universal_effort = match effort { - OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, - OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, - OpenAIReasoningEffort::High => ReasoningEffort::High, - }; - effort_to_budget(universal_effort, max_tokens) - }) - }); + let (effort, budget_tokens, canonical) = if let Some(budget) = reasoning_budget { + let derived_effort = budget_to_effort(budget, max_tokens); + ( + Some(derived_effort), + Some(budget), + Some(ReasoningCanonical::BudgetTokens), + ) + } else if let Some(openai_effort) = reasoning_effort { + let universal_effort = match openai_effort { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + let derived_budget = effort_to_budget(universal_effort, max_tokens); + ( + Some(universal_effort), + Some(derived_budget), + Some(ReasoningCanonical::Effort), + ) + } else { + let default_effort = ReasoningEffort::Medium; + let derived_budget = effort_to_budget(default_effort, max_tokens); + ( + Some(default_effort), + Some(derived_budget), + Some(ReasoningCanonical::Effort), + ) + }; Some(ReasoningConfig { enabled: Some(true), + effort, budget_tokens, + canonical, ..Default::default() }) } diff --git a/crates/lingua/src/providers/openai/convert.rs b/crates/lingua/src/providers/openai/convert.rs index bf8a5303..172be733 100644 --- a/crates/lingua/src/providers/openai/convert.rs +++ b/crates/lingua/src/providers/openai/convert.rs @@ -4,8 +4,8 @@ use crate::serde_json; use crate::universal::convert::TryFromLLM; use crate::universal::defaults::{EMPTY_OBJECT_STR, REFUSAL_TEXT}; use crate::universal::{ - AssistantContent, AssistantContentPart, Message, TextContentPart, ToolCallArguments, - ToolContentPart, ToolResultContentPart, UserContent, UserContentPart, + AssistantContent, AssistantContentPart, Message, ProviderOptions, TextContentPart, + ToolCallArguments, ToolContentPart, ToolResultContentPart, UserContent, UserContentPart, }; use crate::util::media::parse_base64_data_url; use serde::{Deserialize, Serialize}; @@ -1321,6 +1321,7 @@ pub fn universal_to_responses_input( AssistantContent::Array(parts) => { // Categorize all parts into separate collections let mut reasoning_parts: Vec = vec![]; + let mut has_reasoning = false; let mut encrypted_content = None; let mut normal_parts: Vec = vec![]; let mut tool_calls: Vec<(String, String, ToolCallArguments, Option)> = @@ -1332,6 +1333,7 @@ pub fn universal_to_responses_input( text, encrypted_content: ec, } => { + has_reasoning = true; encrypted_content = ec.clone(); if !text.is_empty() { reasoning_parts.push(openai::SummaryText { @@ -1360,8 +1362,8 @@ pub fn universal_to_responses_input( } } - // 1. 
Emit reasoning item if present - if !reasoning_parts.is_empty() || encrypted_content.is_some() { + // 1. Emit reasoning item if any reasoning part existed (even with empty text) + if has_reasoning { result.push(openai::InputItem { role: None, content: None, @@ -1381,7 +1383,8 @@ pub fn universal_to_responses_input( normal_parts, )), input_item_type: Some(openai::InputItemType::Message), - id: None, // id was used for reasoning if present + // Only clear id if reasoning was emitted (it used the id) + id: if has_reasoning { None } else { id.clone() }, status: Some(openai::FunctionCallItemStatus::Completed), ..Default::default() }); @@ -1659,32 +1662,585 @@ impl TryFromLLM for openai::OutputItem { } } +/// Convert OpenAI OutputItem collection to universal Message collection. +/// Each OutputItem becomes a separate Message to preserve the structure. impl TryFromLLM> for Vec { type Error = ConvertError; - fn try_from(messages: Vec) -> Result, Self::Error> { - let input_items: Vec = messages - .into_iter() - .map(TryFromLLM::try_from) - .collect::>()?; - TryFromLLM::try_from(input_items) + fn try_from(items: Vec) -> Result, Self::Error> { + let mut messages: Vec = Vec::new(); + + for mut item in items { + let item_id = item.id.clone(); + + let parts: Vec = match item.output_item_type { + Some(openai::OutputItemType::Message) => { + // Extract text content from message output items + let mut text_parts = Vec::new(); + if let Some(content) = item.content { + for c in content { + if let Some(text) = c.text { + // Preserve annotations and logprobs in provider_options + let provider_options = + if c.annotations.is_some() || c.logprobs.is_some() { + let mut options = serde_json::Map::new(); + if let Some(annotations) = c.annotations { + if let Ok(value) = serde_json::to_value(&annotations) { + options.insert("annotations".to_string(), value); + } + } + if let Some(logprobs) = c.logprobs { + if let Ok(value) = serde_json::to_value(&logprobs) { + options.insert("logprobs".to_string(), value); + } + } + if options.is_empty() { + None + } else { + Some(ProviderOptions { options }) + } + } else { + None + }; + text_parts.push(AssistantContentPart::Text(TextContentPart { + text, + provider_options, + })); + } + } + } + text_parts + } + Some(openai::OutputItemType::Reasoning) => { + // Convert reasoning output to reasoning content parts + let mut reasoning_parts = Vec::new(); + let mut first = true; + for summary in item.summary.unwrap_or_default() { + reasoning_parts.push(AssistantContentPart::Reasoning { + text: summary.text, + encrypted_content: if first { + first = false; + item.encrypted_content.take() + } else { + None + }, + }); + } + // Handle empty reasoning (still preserve encrypted content) + if first { + reasoning_parts.push(AssistantContentPart::Reasoning { + text: String::new(), + encrypted_content: item.encrypted_content.take(), + }); + } + reasoning_parts + } + Some(openai::OutputItemType::FunctionCall) => { + let tool_call_id = + item.call_id + .ok_or_else(|| ConvertError::MissingRequiredField { + field: "function call call_id".to_string(), + })?; + let tool_name = + item.name + .ok_or_else(|| ConvertError::MissingRequiredField { + field: "function call name".to_string(), + })?; + let arguments_str = item + .arguments + .unwrap_or_else(|| EMPTY_OBJECT_STR.to_string()); + + vec![AssistantContentPart::ToolCall { + tool_call_id, + tool_name, + arguments: arguments_str.into(), + provider_options: None, + provider_executed: None, + }] + } + Some(openai::OutputItemType::CodeInterpreterCall) => { + 
vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "code_interpreter".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "code": item.code, + "container_id": item.container_id, + "outputs": item.outputs, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::WebSearchCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "web_search".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "action": item.action, + "queries": item.queries, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::FileSearchCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "file_search".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "queries": item.queries, + "results": item.results, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::ComputerCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "computer".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "action": item.action, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::ImageGenerationCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "image_generation".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "result": item.result, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::LocalShellCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "local_shell".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "action": item.action, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::McpCall) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "mcp_call".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "server_label": item.server_label, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::McpListTools) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "mcp_list_tools".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "server_label": item.server_label, + "tools": item.tools, + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + Some(openai::OutputItemType::McpApprovalRequest) => { + vec![AssistantContentPart::ToolCall { + tool_call_id: item.id.clone().unwrap_or_default(), + tool_name: "mcp_approval_request".to_string(), + arguments: build_tool_arguments(&serde_json::json!({ + "status": item.status, + })), + provider_options: None, + provider_executed: Some(true), + }] + } + _ => { + // Skip unknown output item types + continue; + } + }; + + // Only create a message if there are parts + if !parts.is_empty() { + messages.push(Message::Assistant 
{ + content: AssistantContent::Array(parts), + id: item_id, + }); + } + } + + Ok(messages) } } /// Convert universal Message collection to OpenAI OutputItem collection /// This leverages the Message -> InputItem -> OutputItem conversion chain +/// Convert universal Message collection to OpenAI OutputItem collection. +/// This directly converts content parts to OutputItems, preserving order. impl TryFromLLM> for Vec { type Error = ConvertError; fn try_from(messages: Vec) -> Result { - // Convert each message to InputItem first, then to OutputItem - let input_items: Vec = messages - .into_iter() - .map(TryFromLLM::try_from) - .collect::>()?; - - // Then convert InputItems to OutputItems - input_items.into_iter().map(TryFromLLM::try_from).collect() + let mut result = Vec::new(); + + for msg in messages { + if let Message::Assistant { content, id } = msg { + match content { + AssistantContent::String(text) => { + result.push(openai::OutputItem { + output_item_type: Some(openai::OutputItemType::Message), + role: Some(openai::MessageRole::Assistant), + content: Some(vec![openai::OutputMessageContent { + output_message_content_type: openai::ContentType::OutputText, + text: Some(text), + annotations: None, + logprobs: None, + refusal: None, + }]), + id, + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + AssistantContent::Array(parts) => { + // Track whether we've assigned the id to prevent duplicate IDs + let mut id_used = false; + let use_id = |used: &mut bool, id: &Option| -> Option { + if *used { + None + } else { + *used = true; + id.clone() + } + }; + + // Collect consecutive reasoning parts into a single OutputItem + let mut pending_reasoning_summaries: Vec = vec![]; + let mut pending_encrypted_content: Option = None; + let mut has_pending_reasoning = false; + + let flush_reasoning = + |result: &mut Vec, + summaries: &mut Vec, + encrypted: &mut Option, + has_reasoning: &mut bool, + id_used: &mut bool, + id: &Option| { + if *has_reasoning { + let use_id_inner = + |used: &mut bool, id: &Option| -> Option { + if *used { + None + } else { + *used = true; + id.clone() + } + }; + result.push(openai::OutputItem { + output_item_type: Some(openai::OutputItemType::Reasoning), + summary: Some(std::mem::take(summaries)), + encrypted_content: encrypted.take(), + id: use_id_inner(id_used, id), + ..Default::default() + }); + *has_reasoning = false; + } + }; + + for part in parts { + match part { + AssistantContentPart::Text(text_part) => { + // Flush any pending reasoning before text + flush_reasoning( + &mut result, + &mut pending_reasoning_summaries, + &mut pending_encrypted_content, + &mut has_pending_reasoning, + &mut id_used, + &id, + ); + // Extract annotations and logprobs from provider_options + let (annotations, logprobs) = if let Some(ref opts) = + text_part.provider_options + { + let annotations = + opts.options.get("annotations").and_then(|v| { + serde_json::from_value::>( + v.clone(), + ) + .ok() + }); + let logprobs = opts.options.get("logprobs").and_then(|v| { + serde_json::from_value::>( + v.clone(), + ) + .ok() + }); + (annotations, logprobs) + } else { + (None, None) + }; + result.push(openai::OutputItem { + output_item_type: Some(openai::OutputItemType::Message), + role: Some(openai::MessageRole::Assistant), + content: Some(vec![openai::OutputMessageContent { + output_message_content_type: + openai::ContentType::OutputText, + text: Some(text_part.text), + annotations, + logprobs, + refusal: None, + }]), + id: use_id(&mut id_used, &id), + status: 
Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + AssistantContentPart::Reasoning { + text, + encrypted_content, + } => { + // Accumulate reasoning summaries + has_pending_reasoning = true; + if !text.is_empty() { + pending_reasoning_summaries.push(openai::SummaryText { + text, + summary_text_type: openai::SummaryType::SummaryText, + }); + } + if encrypted_content.is_some() { + pending_encrypted_content = encrypted_content; + } + } + AssistantContentPart::ToolCall { + tool_call_id, + tool_name, + arguments, + provider_executed, + .. + } => { + // Flush any pending reasoning before tool call + flush_reasoning( + &mut result, + &mut pending_reasoning_summaries, + &mut pending_encrypted_content, + &mut has_pending_reasoning, + &mut id_used, + &id, + ); + if provider_executed == Some(true) { + // Built-in tool: convert to appropriate OutputItem type + let args_value = match &arguments { + ToolCallArguments::Valid(map) => { + serde_json::Value::Object(map.clone()) + } + ToolCallArguments::Invalid(s) => { + serde_json::Value::String(s.clone()) + } + }; + + let item = match tool_name.as_str() { + "code_interpreter" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::CodeInterpreterCall, + ), + id: Some(tool_call_id), + code: args_value + .get("code") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + container_id: args_value + .get("container_id") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + outputs: args_value.get("outputs").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "web_search" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::WebSearchCall, + ), + id: Some(tool_call_id), + action: args_value.get("action").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + queries: args_value.get("queries").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "file_search" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::FileSearchCall, + ), + id: Some(tool_call_id), + queries: args_value.get("queries").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + results: args_value.get("results").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "computer" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::ComputerCall, + ), + id: Some(tool_call_id), + action: args_value.get("action").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "image_generation" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::ImageGenerationCall, + ), + id: Some(tool_call_id), + result: args_value + .get("result") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "local_shell" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::LocalShellCall, + ), + id: Some(tool_call_id), + action: args_value.get("action").and_then(|v| { + 
serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "mcp_call" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::McpCall, + ), + id: Some(tool_call_id), + server_label: args_value + .get("server_label") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "mcp_list_tools" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::McpListTools, + ), + id: Some(tool_call_id), + server_label: args_value + .get("server_label") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()), + tools: args_value.get("tools").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + "mcp_approval_request" => openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::McpApprovalRequest, + ), + id: Some(tool_call_id), + status: args_value.get("status").and_then(|v| { + serde_json::from_value(v.clone()).ok() + }), + ..Default::default() + }, + _ => { + // Unknown provider-executed tool - fall back to FunctionCall + openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::FunctionCall, + ), + call_id: Some(tool_call_id), + name: Some(tool_name), + arguments: Some(arguments.to_string()), + status: Some( + openai::FunctionCallItemStatus::Completed, + ), + ..Default::default() + } + } + }; + result.push(item); + } else { + // Regular function call + result.push(openai::OutputItem { + output_item_type: Some( + openai::OutputItemType::FunctionCall, + ), + id: use_id(&mut id_used, &id), + call_id: Some(tool_call_id), + name: Some(tool_name), + arguments: Some(arguments.to_string()), + status: Some(openai::FunctionCallItemStatus::Completed), + ..Default::default() + }); + } + } + // Skip File and ToolResult variants as they don't map to OutputItems + _ => {} + } + } + // Flush any remaining pending reasoning at the end + flush_reasoning( + &mut result, + &mut pending_reasoning_summaries, + &mut pending_encrypted_content, + &mut has_pending_reasoning, + &mut id_used, + &id, + ); + } + } + } + } + + Ok(result) } } diff --git a/crates/lingua/src/providers/openai/responses_adapter.rs b/crates/lingua/src/providers/openai/responses_adapter.rs index 0b23cdb9..b394c87d 100644 --- a/crates/lingua/src/providers/openai/responses_adapter.rs +++ b/crates/lingua/src/providers/openai/responses_adapter.rs @@ -312,103 +312,39 @@ impl ProviderAdapter for ResponsesAdapter { } fn response_to_universal(&self, payload: Value) -> Result { - let output = payload + use crate::providers::openai::generated::OutputItem; + + let output_items: Vec = payload .get("output") .and_then(Value::as_array) + .map(|arr| serde_json::from_value(Value::Array(arr.clone()))) + .transpose() + .map_err(|e| { + TransformError::ToUniversalFailed(format!("Failed to parse output items: {}", e)) + })? .ok_or_else(|| TransformError::ToUniversalFailed("missing output".to_string()))?; - // Convert output items to messages - // Responses API has multiple output types: message, function_call, reasoning, etc. 
- let mut messages: Vec = Vec::new(); - let mut tool_calls: Vec = Vec::new(); - - for item in output { - let item_type = item.get("type").and_then(Value::as_str); - - match item_type { - Some("message") => { - // Message type - extract text content - if let Some(content) = item.get("content") { - if let Some(content_arr) = content.as_array() { - let text: String = content_arr - .iter() - .filter_map(|c| { - if c.get("type").and_then(Value::as_str) == Some("output_text") - { - c.get("text").and_then(Value::as_str).map(String::from) - } else { - None - } - }) - .collect::>() - .join(""); - if !text.is_empty() { - messages.push(Message::Assistant { - content: AssistantContent::String(text), - id: None, - }); - } - } - } - } - Some("function_call") => { - // Function call - collect for later conversion to tool calls - tool_calls.push(item.clone()); - } - _ => { - // Skip reasoning and other types for now - } - } - } - - // If we have tool calls but no messages, create an assistant message with tool calls - if !tool_calls.is_empty() && messages.is_empty() { - // Convert function_call items to tool call format - use crate::universal::message::{AssistantContentPart, ToolCallArguments}; - let parts: Vec = tool_calls - .iter() - .filter_map(|tc| { - let name = tc.get("name").and_then(Value::as_str)?; - let call_id = tc.get("call_id").and_then(Value::as_str)?; - let arguments = tc.get("arguments").and_then(Value::as_str)?; - - // Try to parse arguments as JSON, fall back to invalid string - let args = serde_json::from_str::>(arguments) - .map(ToolCallArguments::Valid) - .unwrap_or_else(|_| ToolCallArguments::Invalid(arguments.to_string())); - - Some(AssistantContentPart::ToolCall { - tool_call_id: call_id.to_string(), - tool_name: name.to_string(), - arguments: args, - provider_options: None, - provider_executed: None, - }) + let messages: Vec = TryFromLLM::try_from(output_items) + .map_err(|e: ConvertError| TransformError::ToUniversalFailed(e.to_string()))?; + + let has_tool_calls = messages.iter().any(|m| { + if let Message::Assistant { + content: AssistantContent::Array(parts), + .. + } = m + { + parts.iter().any(|p| { + matches!( + p, + crate::universal::message::AssistantContentPart::ToolCall { .. 
} + ) }) - .collect(); - - if !parts.is_empty() { - messages.push(Message::Assistant { - content: AssistantContent::Array(parts), - id: None, - }); + } else { + false } - } - - // If still no messages, try output_text field as fallback - // Include empty string to preserve message structure from source - if messages.is_empty() { - if let Some(text) = payload.get("output_text").and_then(Value::as_str) { - messages.push(Message::Assistant { - content: AssistantContent::String(text.to_string()), - id: None, - }); - } - } + }); - // Map status to finish_reason - // If we have tool calls, the finish reason should be ToolCalls regardless of status - let finish_reason = if !tool_calls.is_empty() { + let finish_reason = if has_tool_calls { Some(FinishReason::ToolCalls) } else { match payload.get("status").and_then(Value::as_str) { @@ -434,15 +370,9 @@ impl ProviderAdapter for ResponsesAdapter { } fn response_from_universal(&self, resp: &UniversalResponse) -> Result { - // Convert messages to InputItems (handles 1:N expansion for mixed content) - let input_items = universal_to_responses_input(&resp.messages) - .map_err(|e| TransformError::FromUniversalFailed(e.to_string()))?; + use crate::providers::openai::generated::OutputItem; - // Convert InputItems to OutputItems using existing infrastructure - let output_items: Vec = input_items - .into_iter() - .map(TryFromLLM::try_from) - .collect::>() + let output_items: Vec = TryFromLLM::try_from(resp.messages.clone()) .map_err(|e: ConvertError| TransformError::FromUniversalFailed(e.to_string()))?; // Serialize OutputItems to JSON values @@ -602,6 +532,7 @@ impl ProviderAdapter for ResponsesAdapter { let response = payload.get("response"); let usage = response .and_then(|r| r.get("usage")) + .filter(|u| !u.is_null()) .map(|u| UniversalUsage::from_provider_value(u, self.format())); let model = response @@ -632,6 +563,7 @@ impl ProviderAdapter for ResponsesAdapter { let response = payload.get("response"); let usage = response .and_then(|r| r.get("usage")) + .filter(|u| !u.is_null()) .map(|u| UniversalUsage::from_provider_value(u, self.format())); Ok(Some(UniversalStreamChunk::new( @@ -656,6 +588,12 @@ impl ProviderAdapter for ResponsesAdapter { } else { payload.get("response") }; + + // If no response data, this is a keep-alive roundtrip + if response.is_none() { + return Ok(Some(UniversalStreamChunk::keep_alive())); + } + let model = response .and_then(|r| r.get("model")) .and_then(Value::as_str) @@ -666,6 +604,7 @@ impl ProviderAdapter for ResponsesAdapter { .map(String::from); let usage = response .and_then(|r| r.get("usage")) + .filter(|u| !u.is_null()) .map(|u| UniversalUsage::from_provider_value(u, self.format())); Ok(Some(UniversalStreamChunk::new( diff --git a/crates/lingua/src/universal/mod.rs b/crates/lingua/src/universal/mod.rs index 720c7499..ef58afc4 100644 --- a/crates/lingua/src/universal/mod.rs +++ b/crates/lingua/src/universal/mod.rs @@ -25,9 +25,9 @@ pub mod transform; pub use defaults::*; pub use message::*; pub use request::{ - parse_stop_sequences, JsonSchemaConfig, ReasoningConfig, ReasoningEffort, ResponseFormatConfig, - ResponseFormatType, SummaryMode, ToolChoiceConfig, ToolChoiceMode, UniversalParams, - UniversalRequest, + parse_stop_sequences, JsonSchemaConfig, ReasoningCanonical, ReasoningConfig, ReasoningEffort, + ResponseFormatConfig, ResponseFormatType, SummaryMode, ToolChoiceConfig, ToolChoiceMode, + UniversalParams, UniversalRequest, }; pub use response::{FinishReason, UniversalResponse, UniversalUsage}; pub use 
stream::{UniversalStreamChoice, UniversalStreamChunk}; diff --git a/crates/lingua/src/universal/reasoning.rs b/crates/lingua/src/universal/reasoning.rs index ebf4ed68..24c2e169 100644 --- a/crates/lingua/src/universal/reasoning.rs +++ b/crates/lingua/src/universal/reasoning.rs @@ -52,7 +52,7 @@ use crate::providers::openai::generated::{ use crate::serde_json::{json, Map, Value}; #[cfg(test)] use crate::universal::request::SummaryMode; -use crate::universal::request::{ReasoningConfig, ReasoningEffort}; +use crate::universal::request::{ReasoningCanonical, ReasoningConfig, ReasoningEffort}; // ============================================================================= // Heuristic Constants @@ -82,9 +82,6 @@ pub const DEFAULT_MAX_TOKENS: i64 = 4096; /// Default reasoning effort when enabled but no budget specified pub const DEFAULT_REASONING_EFFORT: ReasoningEffort = ReasoningEffort::Medium; -/// Required temperature for Anthropic when thinking is enabled -pub const ANTHROPIC_THINKING_TEMPERATURE: f64 = 1.0; - // ============================================================================= // Effort ↔ Budget Conversion // ============================================================================= @@ -105,7 +102,6 @@ pub const ANTHROPIC_THINKING_TEMPERATURE: f64 = 1.0; /// # Validation /// - If `max_tokens` is None, zero, or negative, uses `DEFAULT_MAX_TOKENS` (4096) pub fn effort_to_budget(effort: ReasoningEffort, max_tokens: Option) -> i64 { - // Validate max_tokens - must be strictly positive let max = match max_tokens { Some(value) if value > 0 => value, _ => DEFAULT_MAX_TOKENS, // Use default for None, zero, or negative @@ -163,12 +159,18 @@ pub fn budget_to_effort(budget: i64, max_tokens: Option) -> ReasoningEffort /// Convert Anthropic Thinking to ReasoningConfig. /// -/// Anthropic's thinking is already normalized on `budget_tokens`, so this is a direct mapping. +/// Anthropic's thinking uses `budget_tokens` as canonical. Effort is derived. impl From<&Thinking> for ReasoningConfig { fn from(thinking: &Thinking) -> Self { + let enabled = matches!(thinking.thinking_type, ThinkingType::Enabled); + let budget_tokens = thinking.budget_tokens; + let effort = budget_tokens.map(|b| budget_to_effort(b, None)); + ReasoningConfig { - enabled: Some(matches!(thinking.thinking_type, ThinkingType::Enabled)), - budget_tokens: thinking.budget_tokens, + enabled: Some(enabled), + effort, + budget_tokens, + canonical: Some(ReasoningCanonical::BudgetTokens), ..Default::default() } } @@ -176,8 +178,8 @@ impl From<&Thinking> for ReasoningConfig { /// Convert OpenAI ReasoningEffort to ReasoningConfig with context (for Chat API). /// +/// OpenAI's effort is canonical. Budget_tokens is derived. /// Takes max_tokens as context to compute accurate budget_tokens. -/// Uses DEFAULT_MAX_TOKENS if max_tokens is None. 
impl From<(OpenAIReasoningEffort, Option)> for ReasoningConfig { fn from((effort, max_tokens): (OpenAIReasoningEffort, Option)) -> Self { let universal_effort = match effort { @@ -185,9 +187,14 @@ impl From<(OpenAIReasoningEffort, Option)> for ReasoningConfig { OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, OpenAIReasoningEffort::High => ReasoningEffort::High, }; + // Derive budget_tokens from effort + let budget_tokens = effort_to_budget(universal_effort, max_tokens); + ReasoningConfig { enabled: Some(true), - budget_tokens: Some(effort_to_budget(universal_effort, max_tokens)), + effort: Some(universal_effort), + budget_tokens: Some(budget_tokens), + canonical: Some(ReasoningCanonical::Effort), ..Default::default() } } @@ -195,18 +202,27 @@ impl From<(OpenAIReasoningEffort, Option)> for ReasoningConfig { /// Convert OpenAI Reasoning to ReasoningConfig (for Responses API) - fallback. /// +/// OpenAI's effort is canonical. Budget_tokens is derived. /// Uses DEFAULT_MAX_TOKENS for effort→budget conversion when max_tokens is not available. /// For context-aware conversion, use the tuple-based From impl. impl From<&OpenAIReasoning> for ReasoningConfig { fn from(reasoning: &OpenAIReasoning) -> Self { - let budget_tokens = reasoning.effort.as_ref().map(|e| { - let universal_effort = match e { - OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, - OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, - OpenAIReasoningEffort::High => ReasoningEffort::High, - }; - effort_to_budget(universal_effort, None) // Uses DEFAULT_MAX_TOKENS - }); + // Extract effort and derive budget_tokens + let (effort, budget_tokens) = reasoning + .effort + .as_ref() + .map(|e| { + let universal_effort = match e { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => { + ReasoningEffort::Low + } + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + let budget = effort_to_budget(universal_effort, None); // Uses DEFAULT_MAX_TOKENS + (universal_effort, budget) + }) + .map_or((None, None), |(e, b)| (Some(e), Some(b))); let summary = reasoning .summary @@ -220,7 +236,9 @@ impl From<&OpenAIReasoning> for ReasoningConfig { ReasoningConfig { enabled: Some(true), + effort, budget_tokens, + canonical: Some(ReasoningCanonical::Effort), summary, } } @@ -228,18 +246,26 @@ impl From<&OpenAIReasoning> for ReasoningConfig { /// Convert OpenAI Reasoning to ReasoningConfig with context (for Responses API). /// +/// OpenAI's effort is canonical. Budget_tokens is derived. /// Takes max_tokens as context to compute accurate budget_tokens. -/// Uses provided max_tokens or DEFAULT_MAX_TOKENS if None. 
impl From<(&OpenAIReasoning, Option)> for ReasoningConfig { fn from((reasoning, max_tokens): (&OpenAIReasoning, Option)) -> Self { - let budget_tokens = reasoning.effort.as_ref().map(|e| { - let universal_effort = match e { - OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => ReasoningEffort::Low, - OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, - OpenAIReasoningEffort::High => ReasoningEffort::High, - }; - effort_to_budget(universal_effort, max_tokens) - }); + // Extract effort and derive budget_tokens + let (effort, budget_tokens) = reasoning + .effort + .as_ref() + .map(|e| { + let universal_effort = match e { + OpenAIReasoningEffort::Low | OpenAIReasoningEffort::Minimal => { + ReasoningEffort::Low + } + OpenAIReasoningEffort::Medium => ReasoningEffort::Medium, + OpenAIReasoningEffort::High => ReasoningEffort::High, + }; + let budget = effort_to_budget(universal_effort, max_tokens); + (universal_effort, budget) + }) + .map_or((None, None), |(e, b)| (Some(e), Some(b))); let summary = reasoning .summary @@ -253,7 +279,9 @@ impl From<(&OpenAIReasoning, Option)> for ReasoningConfig { ReasoningConfig { enabled: Some(true), + effort, budget_tokens, + canonical: Some(ReasoningCanonical::Effort), summary, } } @@ -310,10 +338,13 @@ pub fn from_google(config: &Value) -> ReasoningConfig { }); let budget_tokens = config.get("thinkingBudget").and_then(Value::as_i64); + let effort = budget_tokens.map(|b| budget_to_effort(b, None)); ReasoningConfig { enabled, + effort, budget_tokens, + canonical: Some(ReasoningCanonical::BudgetTokens), ..Default::default() } } @@ -328,7 +359,12 @@ fn to_openai_chat(config: &ReasoningConfig, max_tokens: Option) -> Option) -> Opt let mut obj = Map::new(); - // Convert budget_tokens → effort at adapter boundary - let effort = if let Some(budget) = config.budget_tokens { + // Use effort directly (always populated when enabled) + let effort_str = if let Some(effort) = config.effort { + effort.to_string() + } else if let Some(budget) = config.budget_tokens { + // Fallback: convert budget_tokens → effort budget_to_effort(budget, max_tokens).to_string() } else { DEFAULT_REASONING_EFFORT.to_string() // Default if only enabled=true }; - obj.insert("effort".into(), Value::String(effort)); + obj.insert("effort".into(), Value::String(effort_str)); // Summary if let Some(summary) = config.summary { @@ -369,13 +408,20 @@ fn to_openai_responses(config: &ReasoningConfig, max_tokens: Option) -> Opt /// - `Some({ type: "disabled" })` when explicitly disabled /// - `Some({ type: "enabled", budget_tokens: N })` when enabled /// - `None` when not specified (no thinking field) -fn to_anthropic(config: &ReasoningConfig, _max_tokens: Option) -> Option { +fn to_anthropic(config: &ReasoningConfig, max_tokens: Option) -> Option { match config.enabled { // Explicitly disabled - return disabled payload Some(false) => Some(json!({ "type": "disabled" })), // Enabled - return enabled payload with budget Some(true) => { - let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + // Use budget_tokens directly (always populated when enabled) + // Fallback: derive from effort + let budget = config.budget_tokens.unwrap_or_else(|| { + config + .effort + .map(|e| effort_to_budget(e, max_tokens)) + .unwrap_or(MIN_THINKING_BUDGET) + }); Some(json!({ "type": "enabled", "budget_tokens": budget @@ -392,13 +438,20 @@ fn to_anthropic(config: &ReasoningConfig, _max_tokens: Option) -> Option) -> Option { +fn to_google(config: &ReasoningConfig, max_tokens: Option) -> Option { match 
config.enabled { // Explicitly disabled - return disabled payload Some(false) => Some(json!({ "thinkingBudget": 0 })), // Enabled - return enabled payload with budget Some(true) => { - let budget = config.budget_tokens.unwrap_or(MIN_THINKING_BUDGET); + // Use budget_tokens directly (always populated when enabled) + // Fallback: derive from effort + let budget = config.budget_tokens.unwrap_or_else(|| { + config + .effort + .map(|e| effort_to_budget(e, max_tokens)) + .unwrap_or(MIN_THINKING_BUDGET) + }); Some(json!({ "includeThoughts": true, "thinkingBudget": budget diff --git a/crates/lingua/src/universal/request.rs b/crates/lingua/src/universal/request.rs index 1bd22d58..837e14af 100644 --- a/crates/lingua/src/universal/request.rs +++ b/crates/lingua/src/universal/request.rs @@ -225,21 +225,31 @@ impl UniversalParams { /// Configuration for extended thinking / reasoning capabilities. /// -/// Uses `budget_tokens` as the canonical field for cross-provider conversion. -/// When converting TO a provider, values are converted at the adapter boundary. -/// OpenAI's `reasoning_effort` levels are converted to/from budget_tokens using heuristics. +/// Both `effort` and `budget_tokens` are always populated when reasoning is enabled. +/// The `canonical` field indicates which was the original source of truth: +/// - `Effort`: From OpenAI (effort is canonical, budget_tokens derived) +/// - `BudgetTokens`: From Anthropic/Google (budget_tokens is canonical, effort derived) #[derive(Debug, Clone, Default, Serialize, Deserialize)] pub struct ReasoningConfig { /// Whether reasoning/thinking is enabled. #[serde(skip_serializing_if = "Option::is_none")] pub enabled: Option, - /// Token budget for thinking (canonical field). - /// All providers' reasoning configurations are normalized to this field. - /// OpenAI effort levels are converted to budget_tokens at adapter boundaries. + /// Reasoning effort level (low/medium/high). + /// Always populated when enabled. Used by OpenAI Chat/Responses API. + #[serde(skip_serializing_if = "Option::is_none")] + pub effort: Option, + + /// Token budget for thinking. + /// Always populated when enabled. Used by Anthropic/Google. #[serde(skip_serializing_if = "Option::is_none")] pub budget_tokens: Option, + /// Which field is the canonical source of truth. + /// Indicates whether `effort` or `budget_tokens` was the original value. + #[serde(skip_serializing_if = "Option::is_none")] + pub canonical: Option, + /// Summary mode for reasoning output. /// Maps to OpenAI Responses API's `reasoning.summary` field. #[serde(skip_serializing_if = "Option::is_none")] @@ -255,7 +265,10 @@ impl ReasoningConfig { return true; } // Empty config (no meaningful fields set) - self.enabled.is_none() && self.budget_tokens.is_none() && self.summary.is_none() + self.enabled.is_none() + && self.effort.is_none() + && self.budget_tokens.is_none() + && self.summary.is_none() } } @@ -269,7 +282,8 @@ fn reasoning_should_skip(reasoning: &Option) -> bool { } /// Reasoning effort level (portable across providers). -#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize)] +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)] +#[serde(rename_all = "lowercase")] pub enum ReasoningEffort { Low, Medium, @@ -315,6 +329,19 @@ impl AsRef for ReasoningEffort { } } +/// Indicates which field is the canonical source of truth for reasoning configuration. +/// +/// When converting between providers, both `effort` and `budget_tokens` are always populated +/// (one derived from the other). 
This field indicates which was the original source. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)] +#[serde(rename_all = "snake_case")] +pub enum ReasoningCanonical { + /// `effort` is the source of truth (from OpenAI Chat/Responses API) + Effort, + /// `budget_tokens` is the source of truth (from Anthropic/Google) + BudgetTokens, +} + /// Summary mode for reasoning output. #[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)] pub enum SummaryMode { diff --git a/crates/lingua/src/universal/tools.rs b/crates/lingua/src/universal/tools.rs index 2840538a..74ad7853 100644 --- a/crates/lingua/src/universal/tools.rs +++ b/crates/lingua/src/universal/tools.rs @@ -496,11 +496,22 @@ fn detect_tools_format(tools: &Value) -> ToolsFormat { // Has type, no function wrapper → check if Anthropic builtin or Responses API (Some(t), false, _) => { + // OpenAI Responses builtins (check these first since some overlap with Anthropic) + if t == "code_interpreter" + || t == "file_search" + || t == "mcp" + || t == "computer_use_preview" + || t.starts_with("web_search_preview") + // web_search_preview, web_search_preview_2025_03_11 + { + ToolsFormat::OpenAIResponses + } // Anthropic built-in tools use versioned type names (e.g., bash_20250124). // Update this list when Anthropic adds new built-in tool types. - if t.starts_with("bash_") + else if t.starts_with("bash_") || t.starts_with("text_editor_") || t.starts_with("web_search_") + // Anthropic's web_search_YYYYMMDD format { ToolsFormat::AnthropicBuiltin } else {