From 914860a6bdf317b1bb343fd82ed7d66e067d8c91 Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Thu, 15 Jan 2026 14:14:37 -0800
Subject: [PATCH 1/9] feat: add claude-code-router support for multi-model
 testing

- Add ROUTER=true flag to route requests through claude-code-router
- Add router service to docker-compose with profile-based activation
- Support OpenAI (gpt-4o) and Google Gemini (gemini-2.5-pro) as alternatives
- Add router-config.json with provider configuration template
- Update .env.example with provider API key options
- Document router mode limitations (cost tracking shows $0)
---
 .env.example               | 27 ++++++++++++++++++++++-
 CLAUDE.md                  | 11 ++++++++++
 configs/router-config.json | 31 ++++++++++++++++++++++++++
 docker-compose.yml         | 30 +++++++++++++++++++++++++
 shannon                    | 45 +++++++++++++++++++++++++++++++++-----
 5 files changed, 138 insertions(+), 6 deletions(-)
 create mode 100644 configs/router-config.json
diff --git a/.env.example b/.env.example
index 9378e66..27bc16d 100644
--- a/.env.example
+++ b/.env.example
@@ -1,8 +1,33 @@
 # Shannon Environment Configuration
 # Copy this file to .env and fill in your credentials
 
-# Anthropic API Key (required - choose one)
+# Recommended output token configuration for larger tool outputs
+CLAUDE_CODE_MAX_OUTPUT_TOKENS=64000
+
+# =============================================================================
+# OPTION 1: Direct Anthropic (default, no router)
+# =============================================================================
 ANTHROPIC_API_KEY=your-api-key-here
 
 # OR use OAuth token instead
 # CLAUDE_CODE_OAUTH_TOKEN=your-oauth-token-here
+
+# =============================================================================
+# OPTION 2: Router Mode (use alternative providers)
+# =============================================================================
+# Enable router mode by running: ./shannon start ... ROUTER=true
+# Then configure ONE of the providers below:
+
+# --- OpenAI ---
+# OPENAI_API_KEY=sk-your-openai-key
+# ROUTER_DEFAULT=openai,gpt-4o
+
+# --- Google Gemini ---
+GEMINI_API_KEY=your-gemini-key
+ROUTER_DEFAULT=gemini,gemini-2.5-pro
+
+# =============================================================================
+# Available Models
+# =============================================================================
+# OpenAI:  gpt-4o, gpt-4o-mini
+# Gemini:  gemini-2.5-pro, gemini-2.5-flash
diff --git a/CLAUDE.md b/CLAUDE.md
index 04bce8c..2d49db7 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -50,6 +50,7 @@ CONFIG=<file>          YAML configuration file for authentication and testing pa
 OUTPUT=<path>          Custom output directory for session folder (default: ./audit-logs/)
 PIPELINE_TESTING=true  Use minimal prompts and fast retry intervals (10s instead of 5min)
 REBUILD=true           Force Docker rebuild with --no-cache (use when code changes aren't picked up)
+ROUTER=true            Route requests through claude-code-router for multi-model support (see limitations below)
 ```
 
 ### Generate TOTP for Authentication
@@ -284,6 +285,16 @@ Missing tools can be skipped using `PIPELINE_TESTING=true` mode during developme
 - `subfinder` - Subdomain discovery
 - `whatweb` - Web technology detection
 
+### Router Mode Limitations
+When using `ROUTER=true` to route requests through claude-code-router (e.g., to use OpenAI models):
+
+**Cost tracking shows $0.00**: The Claude Agent SDK expects `total_cost_usd` in the result message, which is Anthropic-specific. OpenAI's API returns token counts in `usage` but not a cost field, and the router doesn't translate this. This is a known limitation of the router, not a Shannon bug.
+
+**Workarounds:**
+- Accept $0 costs when using router mode (recommended for dev/testing)
+- Use Anthropic directly for production runs where cost tracking matters
+- Use external tools like `ccusage` for post-hoc token analysis
+
 ### Diagnostic & Utility Scripts
 ```bash
 # View Temporal workflow history
diff --git a/configs/router-config.json b/configs/router-config.json
new file mode 100644
index 0000000..8d043e4
--- /dev/null
+++ b/configs/router-config.json
@@ -0,0 +1,31 @@
+{
+  "HOST": "0.0.0.0",
+  "APIKEY": "shannon-router-key",
+  "LOG": true,
+  "LOG_LEVEL": "info",
+  "NON_INTERACTIVE_MODE": true,
+  "API_TIMEOUT_MS": 600000,
+  "Providers": [
+    {
+      "name": "openai",
+      "api_base_url": "https://api.openai.com/v1/chat/completions",
+      "api_key": "$OPENAI_API_KEY",
+      "models": ["gpt-4o", "gpt-4o-mini"],
+      "transformer": {
+        "use": [["maxtoken", { "max_tokens": 16384 }]]
+      }
+    },
+    {
+      "name": "gemini",
+      "api_base_url": "https://generativelanguage.googleapis.com/v1beta/models/",
+      "api_key": "$GEMINI_API_KEY",
+      "models": ["gemini-2.5-pro", "gemini-2.5-flash"],
+      "transformer": {
+        "use": ["gemini"]
+      }
+    }
+  ],
+  "Router": {
+    "default": "$ROUTER_DEFAULT"
+  }
+}
diff --git a/docker-compose.yml b/docker-compose.yml
index 211e2bf..afb7d3d 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -20,6 +20,8 @@ services:
     environment:
       - TEMPORAL_ADDRESS=temporal:7233
       - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
+      - ANTHROPIC_BASE_URL=${ANTHROPIC_BASE_URL:-}  # Optional: route through claude-code-router
+      - ANTHROPIC_AUTH_TOKEN=${ANTHROPIC_AUTH_TOKEN:-}  # Auth token for router
       - CLAUDE_CODE_OAUTH_TOKEN=${CLAUDE_CODE_OAUTH_TOKEN:-}
       - CLAUDE_CODE_MAX_OUTPUT_TOKENS=${CLAUDE_CODE_MAX_OUTPUT_TOKENS:-64000}
     depends_on:
@@ -36,5 +38,33 @@ services:
     security_opt:
       - seccomp:unconfined
 
+  # Optional: claude-code-router for multi-model support
+  # Start with: ROUTER=true ./shannon start ...
+  router:
+    image: node:20-slim
+    profiles: ["router"]  # Only starts when explicitly requested
+    command: >
+      sh -c "apt-get update && apt-get install -y gettext-base &&
+             npm install -g @musistudio/claude-code-router &&
+             mkdir -p /root/.claude-code-router &&
+             envsubst < /config/router-config.json > /root/.claude-code-router/config.json &&
+             ccr start"
+    ports:
+      - "127.0.0.1:3456:3456"  # Loopback only: router APIKEY is a fixed, committed value; workers use http://router:3456
+    volumes:
+      - ./configs/router-config.json:/config/router-config.json:ro
+    environment:
+      - HOST=0.0.0.0
+      - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}
+      - GEMINI_API_KEY=${GEMINI_API_KEY:-}
+      - ROUTER_DEFAULT=${ROUTER_DEFAULT:-openai,gpt-4o}
+    healthcheck:
+      test: ["CMD", "node", "-e", "require('http').get('http://localhost:3456/health', r => process.exit(r.statusCode === 200 ? 0 : 1)).on('error', () => process.exit(1))"]
+      interval: 10s
+      timeout: 5s
+      retries: 5
+      start_period: 30s
+
 volumes:
   temporal-data:
diff --git a/shannon b/shannon
index 61f8a4e..c979d76 100755
--- a/shannon
+++ b/shannon
@@ -35,6 +35,7 @@ Options for 'start':
   CONFIG=<path>          Configuration file (YAML)
   OUTPUT=<path>          Output directory for reports (default: ./audit-logs/)
   PIPELINE_TESTING=true  Use minimal prompts for fast testing
+  ROUTER=true            Route requests through claude-code-router (multi-model support)
 
 Options for 'stop':
   CLEAN=true             Remove all data including volumes
@@ -63,6 +64,7 @@ parse_args() {
       CLEAN=*) CLEAN="${arg#CLEAN=}" ;;
       PIPELINE_TESTING=*) PIPELINE_TESTING="${arg#PIPELINE_TESTING=}" ;;
       REBUILD=*) REBUILD="${arg#REBUILD=}" ;;
+      ROUTER=*) ROUTER="${arg#ROUTER=}" ;;
     esac
   done
 }
@@ -121,10 +123,16 @@ cmd_start() {
     exit 1
   fi
 
-  # Check for API key
+  # Check for API key (router mode can use OPENAI_API_KEY or GEMINI_API_KEY instead)
   if [ -z "$ANTHROPIC_API_KEY" ] && [ -z "$CLAUDE_CODE_OAUTH_TOKEN" ]; then
-    echo "ERROR: Set ANTHROPIC_API_KEY or CLAUDE_CODE_OAUTH_TOKEN in .env"
-    exit 1
+    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ]; }; then
+      # Router mode with alternative provider - set a placeholder for SDK init
+      export ANTHROPIC_API_KEY="router-mode"
+    else
+      echo "ERROR: Set ANTHROPIC_API_KEY or CLAUDE_CODE_OAUTH_TOKEN in .env"
+      echo "       (or use ROUTER=true with OPENAI_API_KEY or GEMINI_API_KEY)"
+      exit 1
+    fi
   fi
 
   # Determine container path for REPO
@@ -149,6 +157,33 @@ cmd_start() {
     export OUTPUT_DIR="$OUTPUT"
   fi
 
+  # Handle ROUTER flag - start claude-code-router for multi-model support
+  if [ "$ROUTER" = "true" ]; then
+    # Check if router is already running
+    if docker compose -f "$COMPOSE_FILE" --profile router ps router 2>/dev/null | grep -q "running"; then
+      echo "Router already running, skipping startup..."
+    else
+      echo "Starting claude-code-router..."
+
+      # Check for OpenAI API key
+      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ]; then
+        echo "WARNING: Neither OPENAI_API_KEY nor GEMINI_API_KEY set. Router may not work."
+      fi
+
+      # Start router with profile
+      docker compose -f "$COMPOSE_FILE" --profile router up -d router
+
+      # Give router a few seconds to start (health check disabled for now - TODO: debug later)
+      echo "Waiting for router to start..."
+      sleep 5
+    fi
+
+    # Set ANTHROPIC_BASE_URL to route through router
+    export ANTHROPIC_BASE_URL="http://router:3456"
+    # Set auth token to match router's APIKEY
+    export ANTHROPIC_AUTH_TOKEN="shannon-router-key"
+  fi
+
   # Ensure containers are running (starts them if needed)
   ensure_containers
 
@@ -226,9 +261,9 @@ cmd_stop() {
   parse_args "$@"
 
   if [ "$CLEAN" = "true" ]; then
-    docker compose -f "$COMPOSE_FILE" down -v
+    docker compose -f "$COMPOSE_FILE" --profile router down -v
   else
-    docker compose -f "$COMPOSE_FILE" down
+    docker compose -f "$COMPOSE_FILE" --profile router down
   fi
 }
 

From d925c4942be2001e83f0f63ed7419ba2ebfc5d79 Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Thu, 15 Jan 2026 15:16:05 -0800
Subject: [PATCH 2/9] feat: add DeepSeek provider support for
 claude-code-router

- Add DeepSeek provider config with Together.ai and official API support
- Configure deepseek and enhancetool transformers for reliable tool calling
- Add DEEPSEEK_API_KEY and DEEPSEEK_API_BASE env vars to docker-compose
- Update shannon CLI to recognize DeepSeek as valid router provider
---
 .env.example               | 19 +++++++++++++++----
 configs/router-config.json |  9 +++++++++
 docker-compose.yml         |  2 ++
 shannon                    | 12 ++++++------
 4 files changed, 32 insertions(+), 10 deletions(-)

diff --git a/.env.example b/.env.example
index 27bc16d..8f865f1 100644
--- a/.env.example
+++ b/.env.example
@@ -23,11 +23,22 @@ ANTHROPIC_API_KEY=your-api-key-here
 # ROUTER_DEFAULT=openai,gpt-4o
 
 # --- Google Gemini ---
-GEMINI_API_KEY=your-gemini-key
-ROUTER_DEFAULT=gemini,gemini-2.5-pro
+# GEMINI_API_KEY=your-gemini-key
+# ROUTER_DEFAULT=gemini,gemini-2.5-pro
+
+# --- DeepSeek (cheapest option) ---
+# DEEPSEEK_API_KEY=your-together-or-deepseek-key
+# DEEPSEEK_API_BASE=https://api.together.xyz/v1/chat/completions  # Default: Together.ai
+# ROUTER_DEFAULT=deepseek,deepseek-ai/DeepSeek-V3
+#
+# To use DeepSeek's official API instead:
+# DEEPSEEK_API_BASE=https://api.deepseek.com/chat/completions
+# ROUTER_DEFAULT=deepseek,deepseek-chat
 
 # =============================================================================
 # Available Models
 # =============================================================================
-# OpenAI:  gpt-4o, gpt-4o-mini
-# Gemini:  gemini-2.5-pro, gemini-2.5-flash
+# OpenAI:     gpt-4o, gpt-4o-mini
+# Gemini:     gemini-2.5-pro, gemini-2.5-flash
+# DeepSeek:   (Together.ai) deepseek-ai/DeepSeek-V3, deepseek-ai/DeepSeek-R1
+#             (Official)    deepseek-chat, deepseek-reasoner
diff --git a/configs/router-config.json b/configs/router-config.json
index 8d043e4..6d5213d 100644
--- a/configs/router-config.json
+++ b/configs/router-config.json
@@ -23,6 +23,15 @@
       "transformer": {
         "use": ["gemini"]
       }
+    },
+    {
+      "name": "deepseek",
+      "api_base_url": "$DEEPSEEK_API_BASE",
+      "api_key": "$DEEPSEEK_API_KEY",
+      "models": ["deepseek-ai/DeepSeek-V3", "deepseek-ai/DeepSeek-R1", "deepseek-chat", "deepseek-reasoner"],
+      "transformer": {
+        "use": ["deepseek", "enhancetool"]
+      }
     }
   ],
   "Router": {
diff --git a/docker-compose.yml b/docker-compose.yml
index afb7d3d..664e3b6 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -58,6 +58,8 @@ services:
       - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
       - OPENAI_API_KEY=${OPENAI_API_KEY:-}
       - GEMINI_API_KEY=${GEMINI_API_KEY:-}
+      - DEEPSEEK_API_KEY=${DEEPSEEK_API_KEY:-}
+      - DEEPSEEK_API_BASE=${DEEPSEEK_API_BASE:-https://api.together.xyz/v1/chat/completions}
       - ROUTER_DEFAULT=${ROUTER_DEFAULT:-openai,gpt-4o}
     healthcheck:
       test: ["CMD", "node", "-e", "require('http').get('http://localhost:3456/health', r => process.exit(r.statusCode === 200 ? 0 : 1)).on('error', () => process.exit(1))"]
diff --git a/shannon b/shannon
index c979d76..3719a40 100755
--- a/shannon
+++ b/shannon
@@ -123,14 +123,14 @@ cmd_start() {
     exit 1
   fi
 
-  # Check for API key (router mode can use OPENAI_API_KEY or GEMINI_API_KEY instead)
+  # Check for API key (router mode can use alternative provider API keys)
   if [ -z "$ANTHROPIC_API_KEY" ] && [ -z "$CLAUDE_CODE_OAUTH_TOKEN" ]; then
-    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ]; }; then
+    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ] || [ -n "$DEEPSEEK_API_KEY" ]; }; then
       # Router mode with alternative provider - set a placeholder for SDK init
       export ANTHROPIC_API_KEY="router-mode"
     else
       echo "ERROR: Set ANTHROPIC_API_KEY or CLAUDE_CODE_OAUTH_TOKEN in .env"
-      echo "       (or use ROUTER=true with OPENAI_API_KEY or GEMINI_API_KEY)"
+      echo "       (or use ROUTER=true with OPENAI_API_KEY, GEMINI_API_KEY, or DEEPSEEK_API_KEY)"
       exit 1
     fi
   fi
@@ -165,9 +165,9 @@ cmd_start() {
     else
       echo "Starting claude-code-router..."
 
-      # Check for OpenAI API key
-      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ]; then
-        echo "WARNING: Neither OPENAI_API_KEY nor GEMINI_API_KEY set. Router may not work."
+      # Check for provider API keys
+      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ] && [ -z "$DEEPSEEK_API_KEY" ]; then
+        echo "WARNING: No provider API key set (OPENAI_API_KEY, GEMINI_API_KEY, or DEEPSEEK_API_KEY). Router may not work."
       fi
 
       # Start router with profile

From d01980ce4b5fddbb811dc77a36394aabf97c674b Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Thu, 15 Jan 2026 15:21:34 -0800
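Subject: [PATCH 3/9] feat: add OpenRouter provider support for
 claude-code-router

- Add OpenRouter provider config using the openrouter transformer
- Add OPENROUTER_API_KEY env var to the docker-compose router service
- Update shannon CLI to recognize OpenRouter as a valid router provider
- Document the OpenRouter key and example models in .env.example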
---
 .env.example               |  6 ++++++
 configs/router-config.json | 14 ++++++++++++++
 docker-compose.yml         |  1 +
 shannon                    |  8 ++++----
 4 files changed, 25 insertions(+), 4 deletions(-)

diff --git a/.env.example b/.env.example
index 8f865f1..bcdd021 100644
--- a/.env.example
+++ b/.env.example
@@ -35,6 +35,10 @@ ANTHROPIC_API_KEY=your-api-key-here
 # DEEPSEEK_API_BASE=https://api.deepseek.com/chat/completions
 # ROUTER_DEFAULT=deepseek,deepseek-chat
 
+# --- OpenRouter (access 100+ models via single API) ---
+# OPENROUTER_API_KEY=sk-or-your-openrouter-key
+# ROUTER_DEFAULT=openrouter,anthropic/claude-sonnet-4
+
 # =============================================================================
 # Available Models
 # =============================================================================
@@ -42,3 +46,5 @@ ANTHROPIC_API_KEY=your-api-key-here
 # Gemini:     gemini-2.5-pro, gemini-2.5-flash
 # DeepSeek:   (Together.ai) deepseek-ai/DeepSeek-V3, deepseek-ai/DeepSeek-R1
 #             (Official)    deepseek-chat, deepseek-reasoner
+# OpenRouter: anthropic/claude-sonnet-4, google/gemini-2.5-pro-preview,
+#             openai/gpt-4o, meta-llama/llama-3.3-70b-instruct (100+ more)
diff --git a/configs/router-config.json b/configs/router-config.json
index 6d5213d..dd3fc47 100644
--- a/configs/router-config.json
+++ b/configs/router-config.json
@@ -32,6 +32,20 @@
       "transformer": {
         "use": ["deepseek", "enhancetool"]
       }
+    },
+    {
+      "name": "openrouter",
+      "api_base_url": "https://openrouter.ai/api/v1/chat/completions",
+      "api_key": "$OPENROUTER_API_KEY",
+      "models": [
+        "anthropic/claude-sonnet-4",
+        "google/gemini-2.5-pro-preview",
+        "openai/gpt-4o",
+        "meta-llama/llama-3.3-70b-instruct"
+      ],
+      "transformer": {
+        "use": ["openrouter"]
+      }
     }
   ],
   "Router": {
diff --git a/docker-compose.yml b/docker-compose.yml
index 664e3b6..0f55219 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -60,6 +60,7 @@ services:
       - GEMINI_API_KEY=${GEMINI_API_KEY:-}
       - DEEPSEEK_API_KEY=${DEEPSEEK_API_KEY:-}
       - DEEPSEEK_API_BASE=${DEEPSEEK_API_BASE:-https://api.together.xyz/v1/chat/completions}
+      - OPENROUTER_API_KEY=${OPENROUTER_API_KEY:-}
       - ROUTER_DEFAULT=${ROUTER_DEFAULT:-openai,gpt-4o}
     healthcheck:
       test: ["CMD", "node", "-e", "require('http').get('http://localhost:3456/health', r => process.exit(r.statusCode === 200 ? 0 : 1)).on('error', () => process.exit(1))"]
diff --git a/shannon b/shannon
index 3719a40..760b0b1 100755
--- a/shannon
+++ b/shannon
@@ -125,12 +125,12 @@ cmd_start() {
 
   # Check for API key (router mode can use alternative provider API keys)
   if [ -z "$ANTHROPIC_API_KEY" ] && [ -z "$CLAUDE_CODE_OAUTH_TOKEN" ]; then
-    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ] || [ -n "$DEEPSEEK_API_KEY" ]; }; then
+    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ] || [ -n "$DEEPSEEK_API_KEY" ] || [ -n "$OPENROUTER_API_KEY" ]; }; then
       # Router mode with alternative provider - set a placeholder for SDK init
       export ANTHROPIC_API_KEY="router-mode"
     else
       echo "ERROR: Set ANTHROPIC_API_KEY or CLAUDE_CODE_OAUTH_TOKEN in .env"
-      echo "       (or use ROUTER=true with OPENAI_API_KEY, GEMINI_API_KEY, or DEEPSEEK_API_KEY)"
+      echo "       (or use ROUTER=true with OPENAI_API_KEY, GEMINI_API_KEY, DEEPSEEK_API_KEY, or OPENROUTER_API_KEY)"
       exit 1
     fi
   fi
@@ -166,8 +166,8 @@ cmd_start() {
       echo "Starting claude-code-router..."
 
       # Check for provider API keys
-      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ] && [ -z "$DEEPSEEK_API_KEY" ]; then
-        echo "WARNING: No provider API key set (OPENAI_API_KEY, GEMINI_API_KEY, or DEEPSEEK_API_KEY). Router may not work."
+      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ] && [ -z "$DEEPSEEK_API_KEY" ] && [ -z "$OPENROUTER_API_KEY" ]; then
+        echo "WARNING: No provider API key set (OPENAI_API_KEY, GEMINI_API_KEY, DEEPSEEK_API_KEY, or OPENROUTER_API_KEY). Router may not work."
       fi
 
       # Start router with profile

From cd04c7a6d2d34f6bfbc7dcc986c9287a8fac913d Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Thu, 15 Jan 2026 18:30:19 -0800
Subject: [PATCH 4/9] feat: add model tracking and reporting across pipeline

- Track actual model name from router through audit logs, session.json, and query output
- Add router-utils.ts to resolve model names from ROUTER_DEFAULT env var
- Inject model info into final report's Executive Summary section
- Update documentation with supported providers, pricing, and config examples
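- Update router-config.json to newer models (GPT-5.2, GPT-5 mini, Gemini 3 Pro
  preview via OpenRouter) and trim the per-provider model lists
- Switch the OpenAI transformer from maxtoken to maxcompletiontokens
- Replace the CLAUDE.md "Router Mode Limitations" section with a Router Mode overview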
---
 .env.example                 | 14 +++---
 CLAUDE.md                    | 52 +++++++++++++++++-----
 README.md                    | 50 ++++++++++++++++++++-
 configs/router-config.json   | 13 +++---
 docker-compose.yml           |  1 +
 src/ai/claude-executor.ts    | 34 ++++++++++-----
 src/ai/message-handlers.ts   | 18 +++++---
 src/ai/router-utils.ts       | 34 +++++++++++++++
 src/audit/audit-session.ts   |  7 +--
 src/audit/metrics-tracker.ts | 21 ++++++---
 src/phases/pre-recon.ts      |  6 +--
 src/phases/reporting.ts      | 84 ++++++++++++++++++++++++++++++++++++
 src/temporal/activities.ts   | 26 ++++++++++-
 src/temporal/query.ts        |  3 ++
 src/temporal/shared.ts       |  1 +
 src/temporal/workflows.ts    |  4 ++
 16 files changed, 312 insertions(+), 56 deletions(-)
 create mode 100644 src/ai/router-utils.ts

diff --git a/.env.example b/.env.example
index bcdd021..fd00877 100644
--- a/.env.example
+++ b/.env.example
@@ -20,7 +20,7 @@ ANTHROPIC_API_KEY=your-api-key-here
 
 # --- OpenAI ---
 # OPENAI_API_KEY=sk-your-openai-key
-# ROUTER_DEFAULT=openai,gpt-4o
+# ROUTER_DEFAULT=openai,gpt-5.2
 
 # --- Google Gemini ---
 # GEMINI_API_KEY=your-gemini-key
@@ -42,9 +42,9 @@ ANTHROPIC_API_KEY=your-api-key-here
 # =============================================================================
 # Available Models
 # =============================================================================
-# OpenAI:     gpt-4o, gpt-4o-mini
-# Gemini:     gemini-2.5-pro, gemini-2.5-flash
-# DeepSeek:   (Together.ai) deepseek-ai/DeepSeek-V3, deepseek-ai/DeepSeek-R1
-#             (Official)    deepseek-chat, deepseek-reasoner
-# OpenRouter: anthropic/claude-sonnet-4, google/gemini-2.5-pro-preview,
-#             openai/gpt-4o, meta-llama/llama-3.3-70b-instruct (100+ more)
+# OpenAI:     gpt-5.2, gpt-5-mini
+# Gemini:     gemini-2.5-pro
+# DeepSeek:   (Together.ai) deepseek-ai/DeepSeek-V3
+#             (Official)    deepseek-chat
+# OpenRouter: anthropic/claude-sonnet-4, google/gemini-3-pro-preview,
+#             openai/gpt-5.2 (100+ more)
diff --git a/CLAUDE.md b/CLAUDE.md
index 2d49db7..8d2d55c 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -50,7 +50,7 @@ CONFIG=<file>          YAML configuration file for authentication and testing pa
 OUTPUT=<path>          Custom output directory for session folder (default: ./audit-logs/)
 PIPELINE_TESTING=true  Use minimal prompts and fast retry intervals (10s instead of 5min)
 REBUILD=true           Force Docker rebuild with --no-cache (use when code changes aren't picked up)
-ROUTER=true            Route requests through claude-code-router for multi-model support (see limitations below)
+ROUTER=true            Route requests through claude-code-router for multi-model support
 ```
 
 ### Generate TOTP for Authentication
@@ -262,11 +262,51 @@ The tool should only be used on systems you own or have explicit permission to t
 - `shannon` - CLI script for running pentests
 - `docker-compose.yml` - Temporal server + worker containers
 - `configs/` - YAML configs with `config-schema.json` for validation
+- `configs/router-config.json` - Router service configuration for multi-model support
 - `prompts/` - AI prompt templates (`vuln-*.txt`, `exploit-*.txt`, etc.)
 
 **Output:**
 - `audit-logs/{hostname}_{sessionId}/` - Session metrics, agent logs, deliverables
 
+### Router Mode (Multi-Model Support)
+
+Shannon supports routing Claude Agent SDK requests through alternative LLM providers via [claude-code-router](https://github.com/musistudio/claude-code-router).
+
+**Enable router mode:**
+```bash
+./shannon start URL=<url> REPO=<path> ROUTER=true
+```
+
+**Supported Providers:**
+
+| Provider | Models | Use Case |
+|----------|--------|----------|
+| OpenAI | `gpt-5.2`, `gpt-5-mini` | Good tool use, balanced cost/performance |
+| Gemini | `gemini-2.5-pro` | Long context (1M+ tokens), strong reasoning |
+| DeepSeek | `deepseek-ai/DeepSeek-V3`, `deepseek-chat` | Cheapest option for dev/testing |
+| OpenRouter | `anthropic/claude-sonnet-4`, `google/gemini-3-pro-preview`, `openai/gpt-5.2` | Multi-provider access via single API |
+
+**Configuration (in .env):**
+```bash
+# OpenAI
+OPENAI_API_KEY=sk-your-key
+ROUTER_DEFAULT=openai,gpt-5.2
+
+# Gemini
+GEMINI_API_KEY=your-gemini-key
+ROUTER_DEFAULT=gemini,gemini-2.5-pro
+
+# DeepSeek (via Together.ai)
+DEEPSEEK_API_KEY=your-together-key
+ROUTER_DEFAULT=deepseek,deepseek-ai/DeepSeek-V3
+
+# OpenRouter
+OPENROUTER_API_KEY=sk-or-your-key
+ROUTER_DEFAULT=openrouter,anthropic/claude-sonnet-4
+```
+
+**Note:** Shannon is optimized for Anthropic's Claude models. Alternative providers are useful for cost savings during development but may produce varying results.
+
 ## Troubleshooting
 
 ### Common Issues
@@ -285,16 +325,6 @@ Missing tools can be skipped using `PIPELINE_TESTING=true` mode during developme
 - `subfinder` - Subdomain discovery
 - `whatweb` - Web technology detection
 
-### Router Mode Limitations
-When using `ROUTER=true` to route requests through claude-code-router (e.g., to use OpenAI models):
-
-**Cost tracking shows $0.00**: The Claude Agent SDK expects `total_cost_usd` in the result message, which is Anthropic-specific. OpenAI's API returns token counts in `usage` but not a cost field, and the router doesn't translate this. This is a known limitation of the router, not a Shannon bug.
-
-**Workarounds:**
-- Accept $0 costs when using router mode (recommended for dev/testing)
-- Use Anthropic directly for production runs where cost tracking matters
-- Use external tools like `ccusage` for post-hoc token analysis
-
 ### Diagnostic & Utility Scripts
 ```bash
 # View Temporal workflow history
diff --git a/README.md b/README.md
index 51b9916..a0cf107 100644
--- a/README.md
+++ b/README.md
@@ -84,6 +84,7 @@ Shannon is available in two editions:
   - [Stopping Shannon](#stopping-shannon)
   - [Usage Examples](#usage-examples)
   - [Configuration (Optional)](#configuration-optional)
+  - [Router Mode (Alternative Providers)](#router-mode-alternative-providers)
   - [Output and Results](#output-and-results)
 - [Sample Reports & Benchmarks](#-sample-reports--benchmarks)
 - [Architecture](#-architecture)
@@ -100,7 +101,9 @@ Shannon is available in two editions:
 ### Prerequisites
 
 - **Docker** - Container runtime ([Install Docker](https://docs.docker.com/get-docker/))
-- **Anthropic API key or Claude Code OAuth token** - Get from [Anthropic Console](https://console.anthropic.com)
+- **AI Provider Credentials** (choose one):
+  - **Anthropic API key or Claude Code OAuth token** (recommended) - Get from [Anthropic Console](https://console.anthropic.com)
+  - **Alternative providers via Router Mode** - OpenAI, Google Gemini, DeepSeek, or OpenRouter (see [Router Mode](#router-mode-alternative-providers))
 
 ### Quick Start
 
@@ -252,6 +255,49 @@ rules:
 
 If your application uses two-factor authentication, simply add the TOTP secret to your config file. The AI will automatically generate the required codes during testing.
 
+### Router Mode (Alternative Providers)
+
+Shannon can route requests through alternative AI providers instead of Anthropic. This is useful for:
+- **Cost optimization** - DeepSeek is significantly cheaper (~$0.14/M input tokens vs $3/M for Claude)
+- **Model experimentation** - Test with GPT-5.2, Gemini 3, or open-source models
+- **API availability** - Use OpenRouter if Anthropic API is unavailable in your region
+
+#### Quick Setup
+
+1. Add your provider API key to `.env`:
+   ```bash
+   # Choose one provider:
+   OPENAI_API_KEY=sk-...
+   # OR
+   GEMINI_API_KEY=...
+   # OR
+   DEEPSEEK_API_KEY=...
+   # OR
+   OPENROUTER_API_KEY=sk-or-...
+
+   # Set default model:
+   ROUTER_DEFAULT=openai,gpt-5.2  # provider,model format
+   ```
+
+2. Run with `ROUTER=true`:
+   ```bash
+   ./shannon start URL=https://example.com REPO=/path/to/repo ROUTER=true
+   ```
+
+#### Supported Providers
+
+| Provider | Models | Approx. Cost | Notes |
+|----------|--------|--------------|-------|
+| **Anthropic** (default) | Claude Sonnet 4 | $3/$15 per M tokens | Best quality, recommended |
+| **OpenAI** | gpt-5.2, gpt-5-mini | $2.50/$10 per M tokens | Good alternative |
+| **Google Gemini** | gemini-2.5-pro | ~$1.25/$5 per M tokens | Long context (1M+), strong reasoning |
+| **DeepSeek** | DeepSeek-V3 | ~$0.14/$0.28 per M tokens | Cheapest option |
+| **OpenRouter** | 100+ models | Varies | Single API for many models |
+
+#### Disclaimer
+
+> **Output quality depends on model choice.** Shannon is optimized for and tested with Anthropic's Claude models. Alternative providers may produce varying results depending on the model's reasoning capabilities.
+
 ### Output and Results
 
 All results are saved to `./audit-logs/{hostname}_{sessionId}/` by default. Use `--output <path>` to specify a custom directory.
@@ -430,7 +476,7 @@ Shannon is designed for legitimate security auditing purposes only.
 #### **5. Cost & Performance**
 
 - **Time**: As of the current version, a full test run typically takes **1 to 1.5 hours** to complete.
-- **Cost**: Running the full test using Anthropic's Claude 4.5 Sonnet model may incur costs of approximately **$50 USD**. Please note that costs are subject to change based on model pricing and the complexity of the target application.
+- **Cost**: Running the full test using Anthropic's Claude 4.5 Sonnet model may incur costs of approximately **$50 USD**. Using Router Mode with DeepSeek can reduce this to **~$5 USD** (see [Router Mode](#router-mode-alternative-providers)). Costs vary based on model pricing and application complexity.
 
 #### **6. Windows Antivirus False Positives**
 
diff --git a/configs/router-config.json b/configs/router-config.json
index dd3fc47..d1a430f 100644
--- a/configs/router-config.json
+++ b/configs/router-config.json
@@ -10,16 +10,16 @@
       "name": "openai",
       "api_base_url": "https://api.openai.com/v1/chat/completions",
       "api_key": "$OPENAI_API_KEY",
-      "models": ["gpt-4o", "gpt-4o-mini"],
+      "models": ["gpt-5.2", "gpt-5-mini"],
       "transformer": {
-        "use": [["maxtoken", { "max_tokens": 16384 }]]
+        "use": [["maxcompletiontokens", { "max_completion_tokens": 16384 }]]
       }
     },
     {
       "name": "gemini",
       "api_base_url": "https://generativelanguage.googleapis.com/v1beta/models/",
       "api_key": "$GEMINI_API_KEY",
-      "models": ["gemini-2.5-pro", "gemini-2.5-flash"],
+      "models": ["gemini-2.5-pro"],
       "transformer": {
         "use": ["gemini"]
       }
@@ -28,7 +28,7 @@
       "name": "deepseek",
       "api_base_url": "$DEEPSEEK_API_BASE",
       "api_key": "$DEEPSEEK_API_KEY",
-      "models": ["deepseek-ai/DeepSeek-V3", "deepseek-ai/DeepSeek-R1", "deepseek-chat", "deepseek-reasoner"],
+      "models": ["deepseek-ai/DeepSeek-V3", "deepseek-chat"],
       "transformer": {
         "use": ["deepseek", "enhancetool"]
       }
@@ -39,9 +39,8 @@
       "api_key": "$OPENROUTER_API_KEY",
       "models": [
         "anthropic/claude-sonnet-4",
-        "google/gemini-2.5-pro-preview",
-        "openai/gpt-4o",
-        "meta-llama/llama-3.3-70b-instruct"
+        "google/gemini-3-pro-preview",
+        "openai/gpt-5.2"
       ],
       "transformer": {
         "use": ["openrouter"]
diff --git a/docker-compose.yml b/docker-compose.yml
index 0f55219..f551b58 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -22,6 +22,7 @@ services:
       - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
       - ANTHROPIC_BASE_URL=${ANTHROPIC_BASE_URL:-}  # Optional: route through claude-code-router
       - ANTHROPIC_AUTH_TOKEN=${ANTHROPIC_AUTH_TOKEN:-}  # Auth token for router
+      - ROUTER_DEFAULT=${ROUTER_DEFAULT:-}  # Model name when using router (e.g., "gemini,gemini-2.5-pro")
       - CLAUDE_CODE_OAUTH_TOKEN=${CLAUDE_CODE_OAUTH_TOKEN:-}
       - CLAUDE_CODE_MAX_OUTPUT_TOKENS=${CLAUDE_CODE_MAX_OUTPUT_TOKENS:-64000}
     depends_on:
diff --git a/src/ai/claude-executor.ts b/src/ai/claude-executor.ts
index 0e57c2a..bd194e2 100644
--- a/src/ai/claude-executor.ts
+++ b/src/ai/claude-executor.ts
@@ -25,23 +25,25 @@ import { dispatchMessage } from './message-handlers.js';
 import { detectExecutionContext, formatErrorOutput, formatCompletionMessage } from './output-formatters.js';
 import { createProgressManager } from './progress-manager.js';
 import { createAuditLogger } from './audit-logger.js';
+import { getActualModelName } from './router-utils.js';
 
 declare global {
   var SHANNON_DISABLE_LOADER: boolean | undefined;
 }
 
 export interface ClaudePromptResult {
-  result?: string | null;
+  result?: string | null | undefined;
   success: boolean;
   duration: number;
-  turns?: number;
+  turns?: number | undefined;
   cost: number;
-  partialCost?: number;
-  apiErrorDetected?: boolean;
-  error?: string;
-  errorType?: string;
-  prompt?: string;
-  retryable?: boolean;
+  model?: string | undefined;
+  partialCost?: number | undefined;
+  apiErrorDetected?: boolean | undefined;
+  error?: string | undefined;
+  errorType?: string | undefined;
+  prompt?: string | undefined;
+  retryable?: boolean | undefined;
 }
 
 interface StdioMcpServer {
@@ -247,6 +249,7 @@ export async function runClaudePrompt(
     result = messageLoopResult.result;
     apiErrorDetected = messageLoopResult.apiErrorDetected;
     totalCost = messageLoopResult.cost;
+    const model = messageLoopResult.model;
 
     // === SPENDING CAP SAFEGUARD ===
     // Defense-in-depth: Detect spending cap that slipped through detectApiError().
@@ -283,6 +286,7 @@ export async function runClaudePrompt(
       duration,
       turns: turnCount,
       cost: totalCost,
+      model,
       partialCost: totalCost,
       apiErrorDetected
     };
@@ -316,6 +320,7 @@ interface MessageLoopResult {
   result: string | null;
   apiErrorDetected: boolean;
   cost: number;
+  model?: string | undefined;
 }
 
 interface MessageLoopDeps {
@@ -339,6 +344,7 @@ async function processMessageStream(
   let result: string | null = null;
   let apiErrorDetected = false;
   let cost = 0;
+  let model: string | undefined;
   let lastHeartbeat = Date.now();
 
   for await (const message of query({ prompt: fullPrompt, options })) {
@@ -370,12 +376,18 @@ async function processMessageStream(
       break;
     }
 
-    if (dispatchResult.type === 'continue' && dispatchResult.apiErrorDetected) {
-      apiErrorDetected = true;
+    if (dispatchResult.type === 'continue') {
+      if (dispatchResult.apiErrorDetected) {
+        apiErrorDetected = true;
+      }
+      // Capture model from SystemInitMessage, but override with router model if applicable
+      if (dispatchResult.model) {
+        model = getActualModelName(dispatchResult.model);
+      }
     }
   }
 
-  return { turnCount, result, apiErrorDetected, cost };
+  return { turnCount, result, apiErrorDetected, cost, model };
 }
 
 // Main entry point for agent execution. Handles retries, git checkpoints, and validation.
diff --git a/src/ai/message-handlers.ts b/src/ai/message-handlers.ts
index c1a8fe7..b57ffa3 100644
--- a/src/ai/message-handlers.ts
+++ b/src/ai/message-handlers.ts
@@ -10,6 +10,7 @@ import { PentestError } from '../error-handling.js';
 import { filterJsonToolCalls } from '../utils/output-formatter.js';
 import { formatTimestamp } from '../utils/formatting.js';
 import chalk from 'chalk';
+import { getActualModelName } from './router-utils.js';
 import {
   formatAssistantOutput,
   formatResultOutput,
@@ -178,7 +179,7 @@ function outputLines(lines: string[]): void {
 
 // Message dispatch result types
 export type MessageDispatchAction =
-  | { type: 'continue'; apiErrorDetected?: boolean }
+  | { type: 'continue'; apiErrorDetected?: boolean | undefined; model?: string | undefined }
   | { type: 'complete'; result: string | null; cost: number }
   | { type: 'throw'; error: Error };
 
@@ -229,13 +230,18 @@ export async function dispatchMessage(
     }
 
     case 'system': {
-      if (message.subtype === 'init' && !execContext.useCleanOutput) {
+      if (message.subtype === 'init') {
         const initMsg = message as SystemInitMessage;
-        console.log(chalk.blue(`    Model: ${initMsg.model}, Permission: ${initMsg.permissionMode}`));
-        if (initMsg.mcp_servers && initMsg.mcp_servers.length > 0) {
-          const mcpStatus = initMsg.mcp_servers.map(s => `${s.name}(${s.status})`).join(', ');
-          console.log(chalk.blue(`    MCP: ${mcpStatus}`));
+        const actualModel = getActualModelName(initMsg.model);
+        if (!execContext.useCleanOutput) {
+          console.log(chalk.blue(`    Model: ${actualModel}, Permission: ${initMsg.permissionMode}`));
+          if (initMsg.mcp_servers && initMsg.mcp_servers.length > 0) {
+            const mcpStatus = initMsg.mcp_servers.map(s => `${s.name}(${s.status})`).join(', ');
+            console.log(chalk.blue(`    MCP: ${mcpStatus}`));
+          }
         }
+        // Return actual model for tracking in audit logs
+        return { type: 'continue', model: actualModel };
       }
       return { type: 'continue' };
     }
diff --git a/src/ai/router-utils.ts b/src/ai/router-utils.ts
new file mode 100644
index 0000000..a2dbd06
--- /dev/null
+++ b/src/ai/router-utils.ts
@@ -0,0 +1,34 @@
+// Copyright (C) 2025 Keygraph, Inc.
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Affero General Public License version 3
+// as published by the Free Software Foundation.
+
+/**
+ * Get the actual model name being used.
+ * Under claude-code-router the SDK still reports its configured model (claude-sonnet),
+ * so when ANTHROPIC_BASE_URL is set, a non-empty model part of ROUTER_DEFAULT wins.
+ */
+export function getActualModelName(sdkReportedModel?: string): string | undefined {
+  const routerBaseUrl = process.env.ANTHROPIC_BASE_URL;
+  const routerDefault = process.env.ROUTER_DEFAULT;
+
+  if (routerBaseUrl && routerDefault) {
+    // Split on the first comma only so a model name may itself contain commas
+    const separatorIndex = routerDefault.indexOf(',');
+    const routedModel = separatorIndex < 0 ? '' : routerDefault.slice(separatorIndex + 1).trim();
+    // An empty model part (e.g., "openai,") is a misconfiguration: keep the SDK's model
+    if (routedModel) {
+      return routedModel;
+    }
+  }
+
+  return sdkReportedModel;
+}
+
+/**
+ * Check if router mode is active, i.e. ANTHROPIC_BASE_URL and ROUTER_DEFAULT are both non-empty.
+ */
+export function isRouterMode(): boolean {
+  return Boolean(process.env.ANTHROPIC_BASE_URL && process.env.ROUTER_DEFAULT);
+}
diff --git a/src/audit/audit-session.ts b/src/audit/audit-session.ts
index 505f6f7..bdfb3c5 100644
--- a/src/audit/audit-session.ts
+++ b/src/audit/audit-session.ts
@@ -26,9 +26,10 @@ interface AgentEndResult {
   duration_ms: number;
   cost_usd: number;
   success: boolean;
-  error?: string;
-  checkpoint?: string;
-  isFinalAttempt?: boolean;
+  model?: string | undefined;
+  error?: string | undefined;
+  checkpoint?: string | undefined;
+  isFinalAttempt?: boolean | undefined;
 }
 
 /**
diff --git a/src/audit/metrics-tracker.ts b/src/audit/metrics-tracker.ts
index 3e552ef..1096fe0 100644
--- a/src/audit/metrics-tracker.ts
+++ b/src/audit/metrics-tracker.ts
@@ -26,7 +26,8 @@ interface AttemptData {
   cost_usd: number;
   success: boolean;
   timestamp: string;
-  error?: string;
+  model?: string | undefined;
+  error?: string | undefined;
 }
 
 interface AgentMetrics {
@@ -34,7 +35,8 @@ interface AgentMetrics {
   attempts: AttemptData[];
   final_duration_ms: number;
   total_cost_usd: number;
-  checkpoint?: string;
+  model?: string | undefined;
+  checkpoint?: string | undefined;
 }
 
 interface PhaseMetrics {
@@ -66,9 +68,10 @@ interface AgentEndResult {
   duration_ms: number;
   cost_usd: number;
   success: boolean;
-  error?: string;
-  checkpoint?: string;
-  isFinalAttempt?: boolean;
+  model?: string | undefined;
+  error?: string | undefined;
+  checkpoint?: string | undefined;
+  isFinalAttempt?: boolean | undefined;
 }
 
 interface ActiveTimer {
@@ -169,6 +172,10 @@ export class MetricsTracker {
       timestamp: formatTimestamp(),
     };
 
+    if (result.model) {
+      attempt.model = result.model;
+    }
+
     if (result.error) {
       attempt.error = result.error;
     }
@@ -183,6 +190,10 @@ export class MetricsTracker {
       agent.status = 'success';
       agent.final_duration_ms = result.duration_ms;
 
+      if (result.model) {
+        agent.model = result.model;
+      }
+
       if (result.checkpoint) {
         agent.checkpoint = result.checkpoint;
       }
diff --git a/src/phases/pre-recon.ts b/src/phases/pre-recon.ts
index 5430029..88dc3ed 100644
--- a/src/phases/pre-recon.ts
+++ b/src/phases/pre-recon.ts
@@ -18,9 +18,9 @@ import type { DistributedConfig } from '../types/config.js';
 interface AgentResult {
   success: boolean;
   duration: number;
-  cost?: number;
-  error?: string;
-  retryable?: boolean;
+  cost?: number | undefined;
+  error?: string | undefined;
+  retryable?: boolean | undefined;
 }
 
 type ToolName = 'nmap' | 'subfinder' | 'whatweb' | 'schemathesis';
diff --git a/src/phases/reporting.ts b/src/phases/reporting.ts
index 7ea28d5..ec9f86b 100644
--- a/src/phases/reporting.ts
+++ b/src/phases/reporting.ts
@@ -68,3 +68,87 @@ export async function assembleFinalReport(sourceDir: string): Promise<string> {
 
   return finalContent;
 }
+
+/**
+ * Inject model information into the final security report.
+ * Reads session.json to get the model(s) used, then injects a "- Model:" line
+ * into the Executive Summary section of the report. Logs and returns without
+ * writing when session.json, model data, the report, or the section is missing.
+ *
+ * @param repoPath - Repository root; the report is read from its deliverables/ folder.
+ * @param outputPath - Directory that contains session.json.
+ */
+export async function injectModelIntoReport(
+  repoPath: string,
+  outputPath: string
+): Promise<void> {
+  // 1. Read session.json to get model information
+  const sessionJsonPath = path.join(outputPath, 'session.json');
+
+  if (!(await fs.pathExists(sessionJsonPath))) {
+    console.log(chalk.yellow('⚠️ session.json not found, skipping model injection'));
+    return;
+  }
+
+  interface SessionData {
+    metrics?: {
+      agents?: Record<string, { model?: string } | null>;
+    };
+  }
+
+  const sessionData: SessionData = await fs.readJson(sessionJsonPath);
+
+  // 2. Extract unique models from all agents (a session without metrics yields none)
+  const agents: Record<string, { model?: string } | null> = sessionData.metrics?.agents ?? {};
+  const models = new Set<string>();
+  for (const agent of Object.values(agents)) {
+    if (agent?.model) {
+      models.add(agent.model);
+    }
+  }
+
+  if (models.size === 0) {
+    console.log(chalk.yellow('⚠️ No model information found in session.json'));
+    return;
+  }
+
+  const modelStr = Array.from(models).join(', ');
+  console.log(chalk.blue(`📝 Injecting model info into report: ${modelStr}`));
+
+  // 3. Read the final report
+  const reportPath = path.join(repoPath, 'deliverables', 'comprehensive_security_assessment_report.md');
+
+  if (!(await fs.pathExists(reportPath))) {
+    console.log(chalk.yellow('⚠️ Final report not found, skipping model injection'));
+    return;
+  }
+
+  let reportContent = await fs.readFile(reportPath, 'utf8');
+
+  // 4. Skip if this exact line is already present, so a re-run does not duplicate it
+  const modelLine = `- Model: ${modelStr}`;
+  if (reportContent.split(/\r?\n/).includes(modelLine)) {
+    console.log(chalk.blue('📝 Model info already present in report, skipping injection'));
+    return;
+  }
+
+  // Replacer functions (not "$1" templates) keep any "$" in a model name literal
+  const assessmentDatePattern = /^(- Assessment Date: .+)$/m;
+  const execSummaryPattern = /^## Executive Summary$/m;
+
+  if (assessmentDatePattern.test(reportContent)) {
+    // Preferred spot: directly after the "- Assessment Date: <date>" line
+    reportContent = reportContent.replace(assessmentDatePattern, (dateLine: string) => `${dateLine}\n${modelLine}`);
+    console.log(chalk.green('✅ Model info injected into Executive Summary'));
+  } else if (execSummaryPattern.test(reportContent)) {
+    // Fallback: first item directly under the Executive Summary header
+    reportContent = reportContent.replace(execSummaryPattern, (header: string) => `${header}\n${modelLine}`);
+    console.log(chalk.green('✅ Model info added to Executive Summary header'));
+  } else {
+    console.log(chalk.yellow('⚠️ Could not find Executive Summary section'));
+    return;
+  }
+
+  // 5. Write modified report back
+  await fs.writeFile(reportPath, reportContent);
+}
diff --git a/src/temporal/activities.ts b/src/temporal/activities.ts
index 9425ccf..90572b0 100644
--- a/src/temporal/activities.ts
+++ b/src/temporal/activities.ts
@@ -67,7 +67,7 @@ import {
   rollbackGitWorkspace,
   getGitCommitHash,
 } from '../utils/git-manager.js';
-import { assembleFinalReport } from '../phases/reporting.js';
+import { assembleFinalReport, injectModelIntoReport } from '../phases/reporting.js';
 import { getPromptNameForAgent } from '../types/agents.js';
 import { AuditSession } from '../audit/index.js';
 import type { WorkflowSummary } from '../audit/workflow-logger.js';
@@ -192,6 +192,7 @@ async function runAgentActivity(
           duration_ms: result.duration,
           cost_usd: 0,
           success: false,
+          model: result.model,
           error: `Spending cap likely reached: ${resultText.slice(0, 100)}`,
         });
         // Throw as billing error so Temporal retries with long backoff
@@ -207,6 +208,7 @@ async function runAgentActivity(
         duration_ms: result.duration,
         cost_usd: result.cost || 0,
         success: false,
+        model: result.model,
         error: result.error || 'Execution failed',
       });
       throw new Error(result.error || 'Agent execution failed');
@@ -221,6 +223,7 @@ async function runAgentActivity(
         duration_ms: result.duration,
         cost_usd: result.cost || 0,
         success: false,
+        model: result.model,
         error: 'Output validation failed',
       });
 
@@ -243,6 +246,7 @@ async function runAgentActivity(
       duration_ms: result.duration,
       cost_usd: result.cost || 0,
       success: true,
+      model: result.model,
       ...(commitHash && { checkpoint: commitHash }),
     });
     await commitGitSuccess(repoPath, agentName);
@@ -254,6 +258,7 @@ async function runAgentActivity(
       outputTokens: null,
       costUsd: result.cost ?? null,
       numTurns: result.turns ?? null,
+      model: result.model,
     };
   } catch (error) {
     // Rollback git workspace before Temporal retry to ensure clean state
@@ -369,6 +374,25 @@ export async function assembleReportActivity(input: ActivityInput): Promise<void
   }
 }
 
+/**
+ * Inject model metadata into the final report (best-effort).
+ * This must be called AFTER runReportAgent to add the model information to the Executive
+ * Summary; it skips when no output path is set and only logs an injection failure.
+ * @param input - Activity input; only repoPath and outputPath are read.
+ */
+export async function injectReportMetadataActivity(input: ActivityInput): Promise<void> {
+  if (!input.outputPath) {
+    console.log(chalk.yellow('⚠️ No output path provided, skipping model injection'));
+    return;
+  }
+
+  // Don't throw - this is a non-critical enhancement
+  await injectModelIntoReport(input.repoPath, input.outputPath).catch((error: unknown) => {
+    const { message } = error as Error;
+    console.log(chalk.yellow(`⚠️ Error injecting model into report: ${message}`));
+  });
+}
+
 /**
  * Check if exploitation should run for a given vulnerability type.
  * Reads the vulnerability queue file and returns the decision.
diff --git a/src/temporal/query.ts b/src/temporal/query.ts
index a97fe74..bf058a7 100644
--- a/src/temporal/query.ts
+++ b/src/temporal/query.ts
@@ -35,6 +35,7 @@ interface AgentMetrics {
   outputTokens: number | null;
   costUsd: number | null;
   numTurns: number | null;
+  model?: string | undefined;
 }
 
 interface PipelineProgress {
@@ -123,8 +124,10 @@ async function queryWorkflow(): Promise<void> {
         const metrics = progress.agentMetrics[agent];
         const duration = metrics ? formatDuration(metrics.durationMs) : 'unknown';
         const cost = metrics?.costUsd ? `$${metrics.costUsd.toFixed(4)}` : '';
+        const model = metrics?.model ? ` [${metrics.model}]` : '';
         console.log(
           chalk.green(`  - ${agent}`) +
+            chalk.blue(model) +
             chalk.gray(` (${duration}${cost ? ', ' + cost : ''})`)
         );
       }
diff --git a/src/temporal/shared.ts b/src/temporal/shared.ts
index e10ad33..9120bfc 100644
--- a/src/temporal/shared.ts
+++ b/src/temporal/shared.ts
@@ -17,6 +17,7 @@ export interface AgentMetrics {
   outputTokens: number | null;
   costUsd: number | null;
   numTurns: number | null;
+  model?: string | undefined;
 }
 
 export interface PipelineSummary {
diff --git a/src/temporal/workflows.ts b/src/temporal/workflows.ts
index 3a2781f..1165b94 100644
--- a/src/temporal/workflows.ts
+++ b/src/temporal/workflows.ts
@@ -276,6 +276,10 @@ export async function pentestPipelineWorkflow(
     // Then run the report agent to add executive summary and clean up
     state.agentMetrics['report'] = await a.runReportAgent(activityInput);
     state.completedAgents.push('report');
+
+    // Inject model metadata into the final report
+    await a.injectReportMetadataActivity(activityInput);
+
     await a.logPhaseTransition(activityInput, 'reporting', 'complete');
 
     // === Complete ===

From 9606ffcf7024a3fd897e722615730e10bcd186c4 Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Fri, 16 Jan 2026 11:18:27 -0800
Subject: [PATCH 5/9] fix: add universal billing error detection for router
 mode

- Add HTTP 402 and 'insufficient credits' patterns to error classification
- Detect provider billing errors in both exception and message content paths
---
 src/ai/message-handlers.ts | 3 +++
 src/error-handling.ts      | 2 ++
 2 files changed, 5 insertions(+)

diff --git a/src/ai/message-handlers.ts b/src/ai/message-handlers.ts
index b57ffa3..6a8418c 100644
--- a/src/ai/message-handlers.ts
+++ b/src/ai/message-handlers.ts
@@ -60,12 +60,15 @@ export function detectApiError(content: string): ApiErrorDetection {
   // When Claude Code hits its spending cap, it returns a short message like
   // "Spending cap reached resets 8am" instead of throwing an error.
   // These should retry with 5-30 min backoff so workflows can recover when cap resets.
+  // Also catches provider billing errors (OpenRouter 402, etc.) that appear in message content.
   const BILLING_PATTERNS = [
     'spending cap',
     'spending limit',
     'cap reached',
     'budget exceeded',
     'usage limit',
+    '402',                  // HTTP Payment Required (universal)
+    'insufficient credits', // OpenRouter
   ];
 
   const isBillingError = BILLING_PATTERNS.some((pattern) =>
diff --git a/src/error-handling.ts b/src/error-handling.ts
index ac605a5..3f00131 100644
--- a/src/error-handling.ts
+++ b/src/error-handling.ts
@@ -211,7 +211,9 @@ export function classifyErrorForTemporal(error: unknown): TemporalErrorClassific
   // === BILLING ERRORS (Retryable with long backoff) ===
   // Anthropic returns billing as 400 invalid_request_error
   // Human can add credits OR wait for spending cap to reset (5-30 min backoff)
+  // 402 is HTTP "Payment Required" - universal across providers (OpenRouter, etc.)
   if (
+    message.includes('402') ||
     message.includes('billing_error') ||
     message.includes('credit balance is too low') ||
     message.includes('insufficient credits') ||

From 63741d780e5b6ccd7a579a1f551a58affbfba94b Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Fri, 16 Jan 2026 17:29:54 -0800
Subject: [PATCH 6/9] revert: remove '402' billing pattern causing false
 positives

Reverts 5428422 - the pattern matched tool call IDs containing "402"
---
 src/ai/message-handlers.ts | 3 ---
 src/error-handling.ts      | 2 --
 2 files changed, 5 deletions(-)

diff --git a/src/ai/message-handlers.ts b/src/ai/message-handlers.ts
index 6a8418c..b57ffa3 100644
--- a/src/ai/message-handlers.ts
+++ b/src/ai/message-handlers.ts
@@ -60,15 +60,12 @@ export function detectApiError(content: string): ApiErrorDetection {
   // When Claude Code hits its spending cap, it returns a short message like
   // "Spending cap reached resets 8am" instead of throwing an error.
   // These should retry with 5-30 min backoff so workflows can recover when cap resets.
-  // Also catches provider billing errors (OpenRouter 402, etc.) that appear in message content.
   const BILLING_PATTERNS = [
     'spending cap',
     'spending limit',
     'cap reached',
     'budget exceeded',
     'usage limit',
-    '402',                  // HTTP Payment Required (universal)
-    'insufficient credits', // OpenRouter
   ];
 
   const isBillingError = BILLING_PATTERNS.some((pattern) =>
diff --git a/src/error-handling.ts b/src/error-handling.ts
index 3f00131..ac605a5 100644
--- a/src/error-handling.ts
+++ b/src/error-handling.ts
@@ -211,9 +211,7 @@ export function classifyErrorForTemporal(error: unknown): TemporalErrorClassific
   // === BILLING ERRORS (Retryable with long backoff) ===
   // Anthropic returns billing as 400 invalid_request_error
   // Human can add credits OR wait for spending cap to reset (5-30 min backoff)
-  // 402 is HTTP "Payment Required" - universal across providers (OpenRouter, etc.)
   if (
-    message.includes('402') ||
     message.includes('billing_error') ||
     message.includes('credit balance is too low') ||
     message.includes('insufficient credits') ||

From f85c1bd193070645400c486fb51d22d8bc33cc01 Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Tue, 20 Jan 2026 09:49:16 -0800
Subject: [PATCH 7/9] refactor: simplify router to OpenAI and OpenRouter
 providers only

- Remove Gemini direct and DeepSeek provider configurations
- Keep OpenAI (gpt-5.2, gpt-5-mini) and OpenRouter (Gemini 3 models)
- Update documentation and environment examples
- Remove cost column from README providers table
---
 .env.example               | 23 +++--------------------
 CLAUDE.md                  | 14 ++------------
 README.md                  | 16 +++++-----------
 configs/router-config.json | 21 +--------------------
 docker-compose.yml         |  3 ---
 shannon                    |  8 ++++----
 6 files changed, 15 insertions(+), 70 deletions(-)

diff --git a/.env.example b/.env.example
index fd00877..c36aced 100644
--- a/.env.example
+++ b/.env.example
@@ -22,29 +22,12 @@ ANTHROPIC_API_KEY=your-api-key-here
 # OPENAI_API_KEY=sk-your-openai-key
 # ROUTER_DEFAULT=openai,gpt-5.2
 
-# --- Google Gemini ---
-# GEMINI_API_KEY=your-gemini-key
-# ROUTER_DEFAULT=gemini,gemini-2.5-pro
-
-# --- DeepSeek (cheapest option) ---
-# DEEPSEEK_API_KEY=your-together-or-deepseek-key
-# DEEPSEEK_API_BASE=https://api.together.xyz/v1/chat/completions  # Default: Together.ai
-# ROUTER_DEFAULT=deepseek,deepseek-ai/DeepSeek-V3
-#
-# To use DeepSeek's official API instead:
-# DEEPSEEK_API_BASE=https://api.deepseek.com/chat/completions
-# ROUTER_DEFAULT=deepseek,deepseek-chat
-
-# --- OpenRouter (access 100+ models via single API) ---
+# --- OpenRouter (access Gemini 3 models via single API) ---
 # OPENROUTER_API_KEY=sk-or-your-openrouter-key
-# ROUTER_DEFAULT=openrouter,anthropic/claude-sonnet-4
+# ROUTER_DEFAULT=openrouter,google/gemini-3-pro-preview
 
 # =============================================================================
 # Available Models
 # =============================================================================
 # OpenAI:     gpt-5.2, gpt-5-mini
-# Gemini:     gemini-2.5-pro
-# DeepSeek:   (Together.ai) deepseek-ai/DeepSeek-V3
-#             (Official)    deepseek-chat
-# OpenRouter: anthropic/claude-sonnet-4, google/gemini-3-pro-preview,
-#             openai/gpt-5.2 (100+ more)
+# OpenRouter: google/gemini-3-pro-preview, google/gemini-3-flash-preview
diff --git a/CLAUDE.md b/CLAUDE.md
index 8d2d55c..be22c68 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -282,9 +282,7 @@ Shannon supports routing Claude Agent SDK requests through alternative LLM provi
 | Provider | Models | Use Case |
 |----------|--------|----------|
 | OpenAI | `gpt-5.2`, `gpt-5-mini` | Good tool use, balanced cost/performance |
-| Gemini | `gemini-2.5-pro` | Long context (1M+ tokens), strong reasoning |
-| DeepSeek | `deepseek-ai/DeepSeek-V3`, `deepseek-chat` | Cheapest option for dev/testing |
-| OpenRouter | `anthropic/claude-sonnet-4`, `google/gemini-3-pro-preview`, `openai/gpt-5.2` | Multi-provider access via single API |
+| OpenRouter | `google/gemini-3-pro-preview`, `google/gemini-3-flash-preview` | Access to Gemini 3 models via single API |
 
 **Configuration (in .env):**
 ```bash
@@ -292,17 +290,9 @@ Shannon supports routing Claude Agent SDK requests through alternative LLM provi
 OPENAI_API_KEY=sk-your-key
 ROUTER_DEFAULT=openai,gpt-5.2
 
-# Gemini
-GEMINI_API_KEY=your-gemini-key
-ROUTER_DEFAULT=gemini,gemini-2.5-pro
-
-# DeepSeek (via Together.ai)
-DEEPSEEK_API_KEY=your-together-key
-ROUTER_DEFAULT=deepseek,deepseek-ai/DeepSeek-V3
-
 # OpenRouter
 OPENROUTER_API_KEY=sk-or-your-key
-ROUTER_DEFAULT=openrouter,anthropic/claude-sonnet-4
+ROUTER_DEFAULT=openrouter,google/gemini-3-pro-preview
 ```
 
 **Note:** Shannon is optimized for Anthropic's Claude models. Alternative providers are useful for cost savings during development but may produce varying results.
diff --git a/README.md b/README.md
index a0cf107..5bb0049 100644
--- a/README.md
+++ b/README.md
@@ -269,10 +269,6 @@ Shannon can route requests through alternative AI providers instead of Anthropic
    # Choose one provider:
    OPENAI_API_KEY=sk-...
    # OR
-   GEMINI_API_KEY=...
-   # OR
-   DEEPSEEK_API_KEY=...
-   # OR
    OPENROUTER_API_KEY=sk-or-...
 
    # Set default model:
@@ -286,13 +282,11 @@ Shannon can route requests through alternative AI providers instead of Anthropic
 
 #### Supported Providers
 
-| Provider | Models | Approx. Cost | Notes |
-|----------|--------|--------------|-------|
-| **Anthropic** (default) | Claude Sonnet 4 | $3/$15 per M tokens | Best quality, recommended |
-| **OpenAI** | gpt-5.2, gpt-5-mini | $2.50/$10 per M tokens | Good alternative |
-| **Google Gemini** | gemini-2.5-pro | ~$1.25/$5 per M tokens | Long context (1M+), strong reasoning |
-| **DeepSeek** | DeepSeek-V3 | ~$0.14/$0.28 per M tokens | Cheapest option |
-| **OpenRouter** | 100+ models | Varies | Single API for many models |
+| Provider | Models | Notes |
+|----------|--------|-------|
+| **Anthropic** | Claude Sonnet 4 | Best quality, recommended |
+| **OpenAI** | gpt-5.2, gpt-5-mini | Good alternative |
+| **OpenRouter** | google/gemini-3-pro-preview, google/gemini-3-flash-preview | Access to Gemini 3 models |
 
 #### Disclaimer
 
diff --git a/configs/router-config.json b/configs/router-config.json
index d1a430f..f12973c 100644
--- a/configs/router-config.json
+++ b/configs/router-config.json
@@ -15,32 +15,13 @@
         "use": [["maxcompletiontokens", { "max_completion_tokens": 16384 }]]
       }
     },
-    {
-      "name": "gemini",
-      "api_base_url": "https://generativelanguage.googleapis.com/v1beta/models/",
-      "api_key": "$GEMINI_API_KEY",
-      "models": ["gemini-2.5-pro"],
-      "transformer": {
-        "use": ["gemini"]
-      }
-    },
-    {
-      "name": "deepseek",
-      "api_base_url": "$DEEPSEEK_API_BASE",
-      "api_key": "$DEEPSEEK_API_KEY",
-      "models": ["deepseek-ai/DeepSeek-V3", "deepseek-chat"],
-      "transformer": {
-        "use": ["deepseek", "enhancetool"]
-      }
-    },
     {
       "name": "openrouter",
       "api_base_url": "https://openrouter.ai/api/v1/chat/completions",
       "api_key": "$OPENROUTER_API_KEY",
       "models": [
-        "anthropic/claude-sonnet-4",
         "google/gemini-3-pro-preview",
-        "openai/gpt-5.2"
+        "google/gemini-3-flash-preview"
       ],
       "transformer": {
         "use": ["openrouter"]
diff --git a/docker-compose.yml b/docker-compose.yml
index f551b58..26cbdfa 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -58,9 +58,6 @@ services:
       - HOST=0.0.0.0
       - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
       - OPENAI_API_KEY=${OPENAI_API_KEY:-}
-      - GEMINI_API_KEY=${GEMINI_API_KEY:-}
-      - DEEPSEEK_API_KEY=${DEEPSEEK_API_KEY:-}
-      - DEEPSEEK_API_BASE=${DEEPSEEK_API_BASE:-https://api.together.xyz/v1/chat/completions}
       - OPENROUTER_API_KEY=${OPENROUTER_API_KEY:-}
       - ROUTER_DEFAULT=${ROUTER_DEFAULT:-openai,gpt-4o}
     healthcheck:
diff --git a/shannon b/shannon
index 760b0b1..e971a2a 100755
--- a/shannon
+++ b/shannon
@@ -125,12 +125,12 @@ cmd_start() {
 
   # Check for API key (router mode can use alternative provider API keys)
   if [ -z "$ANTHROPIC_API_KEY" ] && [ -z "$CLAUDE_CODE_OAUTH_TOKEN" ]; then
-    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$GEMINI_API_KEY" ] || [ -n "$DEEPSEEK_API_KEY" ] || [ -n "$OPENROUTER_API_KEY" ]; }; then
+    if [ "$ROUTER" = "true" ] && { [ -n "$OPENAI_API_KEY" ] || [ -n "$OPENROUTER_API_KEY" ]; }; then
       # Router mode with alternative provider - set a placeholder for SDK init
       export ANTHROPIC_API_KEY="router-mode"
     else
       echo "ERROR: Set ANTHROPIC_API_KEY or CLAUDE_CODE_OAUTH_TOKEN in .env"
-      echo "       (or use ROUTER=true with OPENAI_API_KEY, GEMINI_API_KEY, DEEPSEEK_API_KEY, or OPENROUTER_API_KEY)"
+      echo "       (or use ROUTER=true with OPENAI_API_KEY or OPENROUTER_API_KEY)"
       exit 1
     fi
   fi
@@ -166,8 +166,8 @@ cmd_start() {
       echo "Starting claude-code-router..."
 
       # Check for provider API keys
-      if [ -z "$OPENAI_API_KEY" ] && [ -z "$GEMINI_API_KEY" ] && [ -z "$DEEPSEEK_API_KEY" ] && [ -z "$OPENROUTER_API_KEY" ]; then
-        echo "WARNING: No provider API key set (OPENAI_API_KEY, GEMINI_API_KEY, DEEPSEEK_API_KEY, or OPENROUTER_API_KEY). Router may not work."
+      if [ -z "$OPENAI_API_KEY" ] && [ -z "$OPENROUTER_API_KEY" ]; then
+        echo "WARNING: No provider API key set (OPENAI_API_KEY or OPENROUTER_API_KEY). Router may not work."
       fi
 
       # Start router with profile

From 25fde5240a34b43c5d7a49b1b40f9db5cdefe9ca Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Tue, 20 Jan 2026 09:55:40 -0800
Subject: [PATCH 8/9] docs: remove DeepSeek references from router mode
 documentation

---
 README.md | 19 +++++++++----------
 1 file changed, 9 insertions(+), 10 deletions(-)

diff --git a/README.md b/README.md
index 5bb0049..4affe97 100644
--- a/README.md
+++ b/README.md
@@ -103,7 +103,7 @@ Shannon is available in two editions:
 - **Docker** - Container runtime ([Install Docker](https://docs.docker.com/get-docker/))
 - **AI Provider Credentials** (choose one):
   - **Anthropic API key or Claude Code OAuth token** (recommended) - Get from [Anthropic Console](https://console.anthropic.com)
-  - **Alternative providers via Router Mode** - OpenAI, Google Gemini, DeepSeek, or OpenRouter (see [Router Mode](#router-mode-alternative-providers))
+  - **Alternative providers via Router Mode** - OpenAI or Google Gemini via OpenRouter (see [Router Mode](#router-mode-alternative-providers))
 
 ### Quick Start
 
@@ -257,9 +257,8 @@ If your application uses two-factor authentication, simply add the TOTP secret t
 
 ### Router Mode (Alternative Providers)
 
-Shannon can route requests through alternative AI providers instead of Anthropic. This is useful for:
-- **Cost optimization** - DeepSeek is significantly cheaper (~$0.14/M input tokens vs $3/M for Claude)
-- **Model experimentation** - Test with GPT-5.2, Gemini 3, or open-source models
+Shannon can route requests through alternative AI providers using [claude-code-router](https://github.com/musistudio/claude-code-router). This is useful for:
+- **Model experimentation** - Test with GPT-5.2 or Gemini 3 models
 - **API availability** - Use OpenRouter if Anthropic API is unavailable in your region
 
 #### Quick Setup
@@ -282,11 +281,11 @@ Shannon can route requests through alternative AI providers instead of Anthropic
 
 #### Supported Providers
 
-| Provider | Models | Notes |
-|----------|--------|-------|
-| **Anthropic** | Claude Sonnet 4 | Best quality, recommended |
-| **OpenAI** | gpt-5.2, gpt-5-mini | Good alternative |
-| **OpenRouter** | google/gemini-3-pro-preview, google/gemini-3-flash-preview | Access to Gemini 3 models |
+| Provider | Models |
+|----------|--------|
+| **Anthropic** | Claude Sonnet 4 |
+| **OpenAI** | gpt-5.2, gpt-5-mini |
+| **OpenRouter** | google/gemini-3-pro-preview, google/gemini-3-flash-preview |
 
 #### Disclaimer
 
@@ -470,7 +469,7 @@ Shannon is designed for legitimate security auditing purposes only.
 #### **5. Cost & Performance**
 
 - **Time**: As of the current version, a full test run typically takes **1 to 1.5 hours** to complete.
-- **Cost**: Running the full test using Anthropic's Claude 4.5 Sonnet model may incur costs of approximately **$50 USD**. Using Router Mode with DeepSeek can reduce this to **~$5 USD** (see [Router Mode](#router-mode-alternative-providers)). Costs vary based on model pricing and application complexity.
+- **Cost**: Running the full test using Anthropic's Claude 4.5 Sonnet model may incur costs of approximately **$50 USD**. Costs vary based on model pricing and application complexity.
 
 #### **6. Windows Antivirus False Positives**
 

From a15408e23f0a385ee630481f8dd0eda8305b8e78 Mon Sep 17 00:00:00 2001
From: ajmallesh <ajmallesh@gmail.com>
Date: Tue, 20 Jan 2026 16:42:16 -0800
Subject: [PATCH 9/9] docs: remove Gemini 3 Pro from supported router models

---
 .env.example               | 4 ++--
 CLAUDE.md                  | 4 ++--
 README.md                  | 2 +-
 configs/router-config.json | 1 -
 4 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/.env.example b/.env.example
index c36aced..b9aab98 100644
--- a/.env.example
+++ b/.env.example
@@ -24,10 +24,10 @@ ANTHROPIC_API_KEY=your-api-key-here
 
 # --- OpenRouter (access Gemini 3 models via single API) ---
 # OPENROUTER_API_KEY=sk-or-your-openrouter-key
-# ROUTER_DEFAULT=openrouter,google/gemini-3-pro-preview
+# ROUTER_DEFAULT=openrouter,google/gemini-3-flash-preview
 
 # =============================================================================
 # Available Models
 # =============================================================================
 # OpenAI:     gpt-5.2, gpt-5-mini
-# OpenRouter: google/gemini-3-pro-preview, google/gemini-3-flash-preview
+# OpenRouter: google/gemini-3-flash-preview
diff --git a/CLAUDE.md b/CLAUDE.md
index be22c68..c73d3c9 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -282,7 +282,7 @@ Shannon supports routing Claude Agent SDK requests through alternative LLM provi
 | Provider | Models | Use Case |
 |----------|--------|----------|
 | OpenAI | `gpt-5.2`, `gpt-5-mini` | Good tool use, balanced cost/performance |
-| OpenRouter | `google/gemini-3-pro-preview`, `google/gemini-3-flash-preview` | Access to Gemini 3 models via single API |
+| OpenRouter | `google/gemini-3-flash-preview` | Access to Gemini 3 Flash via a single API |
 
 **Configuration (in .env):**
 ```bash
@@ -292,7 +292,7 @@ ROUTER_DEFAULT=openai,gpt-5.2
 
 # OpenRouter
 OPENROUTER_API_KEY=sk-or-your-key
-ROUTER_DEFAULT=openrouter,google/gemini-3-pro-preview
+ROUTER_DEFAULT=openrouter,google/gemini-3-flash-preview
 ```
 
 **Note:** Shannon is optimized for Anthropic's Claude models. Alternative providers are useful for cost savings during development but may produce varying results.
diff --git a/README.md b/README.md
index 4affe97..48909c8 100644
--- a/README.md
+++ b/README.md
@@ -285,7 +285,7 @@ Shannon can route requests through alternative AI providers using [claude-code-r
 |----------|--------|
 | **Anthropic** | Claude Sonnet 4 |
 | **OpenAI** | gpt-5.2, gpt-5-mini |
-| **OpenRouter** | google/gemini-3-pro-preview, google/gemini-3-flash-preview |
+| **OpenRouter** | google/gemini-3-flash-preview |
 
 #### Disclaimer
 
diff --git a/configs/router-config.json b/configs/router-config.json
index f12973c..cf57b1e 100644
--- a/configs/router-config.json
+++ b/configs/router-config.json
@@ -20,7 +20,6 @@
       "api_base_url": "https://openrouter.ai/api/v1/chat/completions",
       "api_key": "$OPENROUTER_API_KEY",
       "models": [
-        "google/gemini-3-pro-preview",
         "google/gemini-3-flash-preview"
       ],
       "transformer": {