From 3fbb096c906e1a870433916621fb215819a51d03 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 18:48:29 +0100
Subject: [PATCH 01/13] feat: implement multi-provider support and session
 management

This change introduces a provider-based architecture to support multiple LLM backends (Claude, Gemini, Copilot).
It also adds a session manager and tool executor to centralize execution logic and improve session continuity.

- Added lib/providers/base.sh, claude.sh, gemini.sh, copilot.sh
- Added lib/session_manager.sh and lib/tool_executor.sh
- Updated ralph_enable.sh and ralph_loop.sh to use the new provider system
- Added tests for providers and updated existing tests
---
 ANALYSIS_REPORT.md                        |  66 ++
 CLAUDE.md                                 |  50 +-
 IMPLEMENTATION_PLAN_MULTI_PROVIDER.md     |  65 ++
 README.md                                 |  13 +-
 lib/enable_core.sh                        |   9 +-
 lib/providers/base.sh                     |  21 +
 lib/providers/claude.sh                   | 333 ++++++++
 lib/providers/copilot.sh                  | 101 +++
 lib/providers/gemini.sh                   |  86 +++
 lib/session_manager.sh                    | 116 +++
 lib/tool_executor.sh                      |  95 +++
 ralph_enable.sh                           |  54 +-
 ralph_loop.sh                             | 903 +---------------------
 templates/system_prompts/generic_agent.md |  63 ++
 tests/unit/test_cli_modern.bats           |  38 +-
 tests/unit/test_providers.bats            |  69 ++
 tests/unit/test_session_continuity.bats   |   2 +-
 17 files changed, 1121 insertions(+), 963 deletions(-)
 create mode 100644 ANALYSIS_REPORT.md
 create mode 100644 IMPLEMENTATION_PLAN_MULTI_PROVIDER.md
 create mode 100644 lib/providers/base.sh
 create mode 100644 lib/providers/claude.sh
 create mode 100644 lib/providers/copilot.sh
 create mode 100644 lib/providers/gemini.sh
 create mode 100644 lib/session_manager.sh
 create mode 100644 lib/tool_executor.sh
 create mode 100644 templates/system_prompts/generic_agent.md
 create mode 100644 tests/unit/test_providers.bats

diff --git a/ANALYSIS_REPORT.md b/ANALYSIS_REPORT.md
new file mode 100644
index 00000000..3265a9cc
--- /dev/null
+++ b/ANALYSIS_REPORT.md
@@ -0,0 +1,66 @@
+# Analysis: Supporting Gemini & GitHub Copilot in Ralph
+
+## 1. Current Architecture vs. Required Architecture
+
+Currently, **Ralph is a Supervisor**, not an Agent.
+*   **Ralph's Job:** It watches `claude-code`, ensures it doesn't get stuck, manages its rate limits, and decides when to stop.
+*   **Claude Code's Job:** It acts as the **Agent**. It reads files, thinks, decides to edit a file, runs `sed`/`git`, checks the result, and iterates.
+
+**The "Agent Gap":**
+Standard CLIs for Gemini (`gemini`) and GitHub Copilot (`gh copilot`) are primarily **Text-In/Text-Out** interfaces. They generate code snippets or explanations but **do not** natively execute tools (like writing files or running tests) in a continuous loop on your terminal.
+
+To support them, Ralph cannot just "wrap" them. Ralph must **become the Agent Runtime**.
+
+## 2. Transformation Required
+
+To support non-agentic CLIs (like Gemini/Copilot), Ralph must expand its responsibilities:
+
+| Feature | Current (Claude Code) | Proposed (Gemini/Copilot) |
+| :--- | :--- | :--- |
+| **Thinking** | Claude Code | Gemini / Copilot |
+| **Tool Execution** | **Claude Code** | **Ralph (New)** |
+| **Loop Management** | Ralph | Ralph |
+| **State/Memory** | Claude Code | Ralph (New) |
+
+## 3. Key Components to Build
+
+### A. Provider Abstraction Layer (`lib/providers/`)
+We need a standard interface for interacting with different AIs.
+*   `init_session()`: Start a conversation.
+*   `send_message(prompt, context)`: Send user input + file context.
+*   `parse_response(output)`: Extract text content AND **Tool Calls**.
+
+### B. Tool Execution Engine (`lib/tool_executor.sh`)
+Since Gemini/Copilot won't edit files themselves, Ralph must do it.
+*   **Protocol:** Define a format for the AI to request actions (e.g., XML tags like `<write_file path="...">content</write_file>` or JSON function calls).
+*   **Executor:** A script that parses these requests and runs:
+    *   `write_file`: create/update files.
+    *   `run_command`: execute bash commands (with safety checks).
+    *   `read_file`: read file content to feed back to the AI.
+
+### C. Prompt Engineering (`templates/prompts/`)
+*   **Claude:** Uses its built-in system prompt.
+*   **Gemini/Copilot:** We must inject a **System Prompt** that teaches them:
+    *   "You are an autonomous coding agent."
+    *   "You have access to these tools: read_file, write_file..."
+    *   "To use a tool, output this specific format..."
+
+## 4. Implementation Steps
+
+1.  **Refactor `ralph_loop.sh`**:
+    *   Replace direct `claude` calls with `provider.send_message`.
+    *   Add a check: Does the provider handle tools?
+        *   **Yes (Claude):** Do nothing (current behavior).
+        *   **No (Gemini):** Parse output -> Run `ToolExecutor` -> Feed result back to `provider.send_message`.
+
+2.  **Create Provider Adapters**:
+    *   `lib/providers/claude.sh`: Wraps existing logic.
+    *   `lib/providers/gemini.sh`: Wraps `gemini-cli` (or API curl calls), handles JSON parsing.
+    *   `lib/providers/copilot.sh`: Wraps `gh copilot suggest` (more complex due to interactive nature, might need `expect` or API usage).
+
+3.  **Build the Runtime**:
+    *   Implement `lib/tool_executor.sh`.
+    *   Implement "Tool Feedback Loop" in `ralph_loop.sh`.
+
+## 5. Conclusion
+Making Ralph compatible with Gemini/Copilot is a **major architectural upgrade**. It moves Ralph from being a "Process Manager" to being a "ReAct (Reason+Act) Agent Framework".
diff --git a/CLAUDE.md b/CLAUDE.md
index 36c04ae6..e19757b0 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -10,51 +10,27 @@ See [README.md](README.md) for version info, changelog, and user documentation.
 
 ## Core Architecture
 
-The system consists of four main bash scripts and a modular library system:
+The system consists of a modular provider architecture and a core loop:
 
 ### Main Scripts
 
-1. **ralph_loop.sh** - The main autonomous loop that executes Claude Code repeatedly
+1. **ralph_loop.sh** - The main autonomous loop that executes the selected AI provider
 2. **ralph_monitor.sh** - Live monitoring dashboard for tracking loop status
 3. **setup.sh** - Project initialization script for new Ralph projects
-4. **create_files.sh** - Bootstrap script that creates the entire Ralph system
-5. **ralph_import.sh** - PRD/specification import tool that converts documents to Ralph format
-   - Uses modern Claude Code CLI with `--output-format json` for structured responses
-   - Implements `detect_response_format()` and `parse_conversion_response()` for JSON parsing
-   - Backward compatible with older CLI versions (automatic text fallback)
-6. **ralph_enable.sh** - Interactive wizard for enabling Ralph in existing projects
-   - Multi-step wizard with environment detection, task source selection, configuration
-   - Imports tasks from beads, GitHub Issues, or PRD documents
-   - Generates `.ralphrc` project configuration file
-7. **ralph_enable_ci.sh** - Non-interactive version for CI/automation
-   - Same functionality as interactive version with CLI flags
-   - JSON output mode for machine parsing
-   - Exit codes: 0 (success), 1 (error), 2 (already enabled)
+4. **ralph_import.sh** - PRD/specification import tool (uses Claude)
+5. **ralph_enable.sh** - Interactive wizard for enabling Ralph in existing projects (includes Provider selection)
 
 ### Library Components (lib/)
 
-The system uses a modular architecture with reusable components in the `lib/` directory:
-
-1. **lib/circuit_breaker.sh** - Circuit breaker pattern implementation
-   - Prevents runaway loops by detecting stagnation
-   - Three states: CLOSED (normal), HALF_OPEN (monitoring), OPEN (halted)
-   - Configurable thresholds for no-progress and error detection
-   - Automatic state transitions and recovery
-
-2. **lib/response_analyzer.sh** - Intelligent response analysis
-   - Analyzes Claude Code output for completion signals
-   - **JSON output format detection and parsing** (with text fallback)
-   - Supports both flat JSON format and Claude CLI format (`result`, `sessionId`, `metadata`)
-   - Extracts structured fields: status, exit_signal, work_type, files_modified
-   - **Session management**: `store_session_id()`, `get_last_session_id()`, `should_resume_session()`
-   - Automatic session persistence to `.ralph/.claude_session_id` file with 24-hour expiration
-   - Session lifecycle: `get_session_id()`, `reset_session()`, `log_session_transition()`, `init_session_tracking()`
-   - Session history tracked in `.ralph/.ralph_session_history` (last 50 transitions)
-   - Session auto-reset on: circuit breaker open, manual interrupt, project completion
-   - Detects test-only loops and stuck error patterns
-   - Two-stage error filtering to eliminate false positives
-   - Multi-line error matching for accurate stuck loop detection
-   - Confidence scoring for exit decisions
+1. **lib/providers/base.sh** - Provider loader and abstraction layer
+2. **lib/providers/claude.sh** - Claude Code CLI integration
+3. **lib/providers/gemini.sh** - Google Gemini CLI integration (Agent Mode)
+4. **lib/providers/copilot.sh** - GitHub Copilot CLI integration (Agent Mode)
+5. **lib/session_manager.sh** - Centralized session lifecycle management
+6. **lib/circuit_breaker.sh** - Circuit breaker pattern implementation
+7. **lib/response_analyzer.sh** - Intelligent response analysis (shared across providers)
+8. **lib/tool_executor.sh** - Generic tool execution runtime for non-agentic providers (Legacy/Future)
+9. **lib/date_utils.sh** & **lib/timeout_utils.sh** - Cross-platform utilities
 
 3. **lib/date_utils.sh** - Cross-platform date utilities
    - ISO timestamp generation for logging
diff --git a/IMPLEMENTATION_PLAN_MULTI_PROVIDER.md b/IMPLEMENTATION_PLAN_MULTI_PROVIDER.md
new file mode 100644
index 00000000..438765fd
--- /dev/null
+++ b/IMPLEMENTATION_PLAN_MULTI_PROVIDER.md
@@ -0,0 +1,65 @@
+# Implementation Plan: Multi-Provider Support
+
+This plan outlines the steps to transform Ralph into a multi-provider agent framework.
+
+## Phase 1: Modularization (The "Socket")
+**Goal:** Abstract the hardcoded `claude` commands into a plugin system.
+
+- [ ] **Create `lib/providers/` directory.**
+- [ ] **Create `lib/providers/base.sh`:** Define the interface (functions `provider_init`, `provider_chat`, `provider_parse`).
+- [ ] **Create `lib/providers/claude.sh`:** Move current `claude` CLI logic here.
+- [ ] **Update `ralph_loop.sh`**:
+    - Load the selected provider script based on `RALPH_PROVIDER` env var.
+    - Replace `execute_claude_code` with generic `execute_provider_loop`.
+
+## Phase 2: The Agent Runtime (The "Brain")
+**Goal:** Enable Ralph to execute tools for "dumb" LLMs.
+
+- [ ] **Design Tool Protocol:** Define how LLMs should request actions (e.g., Markdown code blocks or XML).
+    - Example:
+      ```xml
+      <tool name="write_file">
+      <path>src/main.py</path>
+      <content>print("hello")</content>
+      </tool>
+      ```
+- [ ] **Create `lib/tool_executor.sh`:**
+    - Function `extract_tool_calls(llm_output)`
+    - Function `execute_tool(name, args)`
+    - Safety checks (prevent `rm -rf /`).
+- [ ] **Create `templates/system_prompts/generic_agent.md`:**
+    - A master prompt that explains available tools and the output format to the LLM.
+
+## Phase 3: Gemini Adapter
+**Goal:** Connect Google Gemini.
+
+- [ ] **Prerequisite:** Install `gemini` CLI or use `curl` with API Key.
+- [ ] **Create `lib/providers/gemini.sh`:**
+    - Implement `provider_chat`:
+        - Construct payload with `templates/system_prompts/generic_agent.md` + User Prompt + History.
+        - Call API.
+    - Implement `provider_parse`:
+        - Extract text.
+        - Detect if tool calls are present.
+
+## Phase 4: GitHub Copilot Adapter
+**Goal:** Connect GitHub Copilot.
+
+- [ ] **Investigation:** Determine best CLI entry point (`gh copilot` vs raw API).
+- [ ] **Create `lib/providers/copilot.sh`:**
+    - Similar adaptation as Gemini.
+    - *Note:* Copilot often refuses "system prompts" in CLI. May require "User" role spoofing.
+
+## Phase 5: Configuration Update
+**Goal:** User-friendly switching.
+
+- [ ] **Update `ralph-setup` / `ralph-enable`:**
+    - Ask "Which AI provider do you want to use?"
+    - Generate `.ralphrc` with `RALPH_PROVIDER=gemini`.
+- [ ] **Update `.ralphrc` template:** Add provider configuration sections.
+
+## Estimated Effort
+- **Phase 1:** 2 days (Refactoring)
+- **Phase 2:** 3-4 days (Security & Logic)
+- **Phase 3:** 1-2 days (Integration)
+- **Total:** ~1-2 weeks for a robust MVP.
diff --git a/README.md b/README.md
index 0179d141..5c1422f2 100644
--- a/README.md
+++ b/README.md
@@ -16,25 +16,26 @@ Ralph is an implementation of the Geoffrey Huntley's technique for Claude Code t
 
 ## Project Status
 
-**Version**: v0.11.4 - Active Development
+**Version**: v0.12.0 - Multi-Provider Support
 **Core Features**: Working and tested
-**Test Coverage**: 484 tests, 100% pass rate
+**Providers**: Claude Code (Anthropic), Google Gemini, GitHub Copilot
 
 ### What's Working Now
+- **Multi-Provider Support**: Switch between Claude, Gemini, and Copilot
+- **Agentic Loops for all providers**: Native support for agentic CLIs
 - Autonomous development loops with intelligent exit detection
 - **Dual-condition exit gate**: Requires BOTH completion indicators AND explicit EXIT_SIGNAL
 - Rate limiting with hourly reset (100 calls/hour, configurable)
 - Circuit breaker with advanced error detection (prevents runaway loops)
 - Response analyzer with semantic understanding and two-stage error filtering
 - **JSON output format support with automatic fallback to text parsing**
-- **Session continuity with `--resume` flag for context preservation (no session hijacking)**
-- **Session expiration with configurable timeout (default: 24 hours)**
+- **Session continuity with `--resume` flag for context preservation**
 - **Modern CLI flags: `--output-format`, `--allowed-tools`, `--no-continue`**
 - **Interactive project enablement with `ralph-enable` wizard**
 - **`.ralphrc` configuration file for project settings**
-- **Live streaming output with `--live` flag for real-time Claude Code visibility**
+- **Live streaming output with `--live` flag (Claude only)**
 - Multi-line error matching for accurate stuck loop detection
-- 5-hour API limit handling with user prompts
+- 5-hour API limit handling with user prompts (Claude only)
 - tmux integration for live monitoring
 - PRD import functionality
 - **CI/CD pipeline with GitHub Actions**
diff --git a/lib/enable_core.sh b/lib/enable_core.sh
index f276a3fd..4be18243 100755
--- a/lib/enable_core.sh
+++ b/lib/enable_core.sh
@@ -662,6 +662,7 @@ FIXPLANEOF
 #   $1 (project_name) - Project name
 #   $2 (project_type) - Project type
 #   $3 (task_sources) - Task sources (local, beads, github)
+#   $4 (provider) - AI Provider (claude, gemini, copilot)
 #
 # Outputs to stdout
 #
@@ -669,6 +670,7 @@ generate_ralphrc() {
     local project_name="${1:-$(basename "$(pwd)")}"
     local project_type="${2:-unknown}"
     local task_sources="${3:-local}"
+    local provider="${4:-claude}"
 
     cat << RALPHRCEOF
 # .ralphrc - Ralph project configuration
@@ -679,6 +681,10 @@ generate_ralphrc() {
 PROJECT_NAME="${project_name}"
 PROJECT_TYPE="${project_type}"
 
+# AI Provider Configuration
+# Options: claude, gemini, copilot
+RALPH_PROVIDER="${provider}"
+
 # Loop settings
 MAX_CALLS_PER_HOUR=100
 CLAUDE_TIMEOUT_MINUTES=15
@@ -729,6 +735,7 @@ enable_ralph_in_directory() {
     local project_name="${ENABLE_PROJECT_NAME:-}"
     local project_type="${ENABLE_PROJECT_TYPE:-}"
     local task_content="${ENABLE_TASK_CONTENT:-}"
+    local provider="${ENABLE_PROVIDER:-claude}"
 
     # Check existing state (use || true to prevent set -e from exiting)
     check_existing_ralph || true
@@ -789,7 +796,7 @@ enable_ralph_in_directory() {
 
     # Generate .ralphrc
     local ralphrc_content
-    ralphrc_content=$(generate_ralphrc "$project_name" "$DETECTED_PROJECT_TYPE" "$task_sources")
+    ralphrc_content=$(generate_ralphrc "$project_name" "$DETECTED_PROJECT_TYPE" "$task_sources" "$provider")
     safe_create_file ".ralphrc" "$ralphrc_content"
 
     enable_log "SUCCESS" "Ralph enabled successfully!"
diff --git a/lib/providers/base.sh b/lib/providers/base.sh
new file mode 100644
index 00000000..f2feef03
--- /dev/null
+++ b/lib/providers/base.sh
@@ -0,0 +1,21 @@
+#!/bin/bash
+# Base Provider Loader for Ralph
+
+# Load the configured provider
+load_provider() {
+    local provider_name="${RALPH_PROVIDER:-claude}"
+    local provider_script="$RALPH_HOME/lib/providers/${provider_name}.sh"
+    
+    # Fallback to local path if RALPH_HOME not set or script not found
+    if [[ ! -f "$provider_script" ]]; then
+        provider_script="$(dirname "${BASH_SOURCE[0]}")/${provider_name}.sh"
+    fi
+
+    if [[ -f "$provider_script" ]]; then
+        source "$provider_script"
+        log_status "INFO" "Loaded AI provider: $provider_name"
+    else
+        log_status "ERROR" "AI provider script not found: $provider_script"
+        exit 1
+    fi
+}
diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
new file mode 100644
index 00000000..499485a5
--- /dev/null
+++ b/lib/providers/claude.sh
@@ -0,0 +1,333 @@
+#!/bin/bash
+# Claude Provider for Ralph
+# Implements the Claude Code CLI integration
+
+# Provider-specific configuration
+CLAUDE_CODE_CMD="claude"
+CLAUDE_MIN_VERSION="2.0.76"
+
+# Load Claude-specific logic
+provider_init() {
+    check_claude_version
+}
+
+# Check Claude CLI version for compatibility with modern flags
+check_claude_version() {
+    local version=$($CLAUDE_CODE_CMD --version 2>/dev/null | grep -oE '[0-9]+\.[0-9]+\.[0-9]+' | head -1)
+
+    if [[ -z "$version" ]]; then
+        log_status "WARN" "Cannot detect Claude CLI version, assuming compatible"
+        return 0
+    fi
+
+    # Compare versions (simplified semver comparison)
+    local required="$CLAUDE_MIN_VERSION"
+
+    # Convert to comparable integers (major * 10000 + minor * 100 + patch)
+    local ver_parts=(${version//./ })
+    local req_parts=(${required//./ })
+
+    local ver_num=$((${ver_parts[0]:-0} * 10000 + ${ver_parts[1]:-0} * 100 + ${ver_parts[2]:-0}))
+    local req_num=$((${req_parts[0]:-0} * 10000 + ${req_parts[1]:-0} * 100 + ${req_parts[2]:-0}))
+
+    if [[ $ver_num -lt $req_num ]]; then
+        log_status "WARN" "Claude CLI version $version < $required. Some modern features may not work."
+        log_status "WARN" "Consider upgrading: npm update -g @anthropic-ai/claude-code"
+        return 1
+    fi
+
+    log_status "INFO" "Claude CLI version $version (>= $required) - modern features enabled"
+    return 0
+}
+
+# Validate allowed tools against whitelist
+validate_allowed_tools() {
+    local tools_input=$1
+    local VALID_TOOL_PATTERNS=(
+        "Write" "Read" "Edit" "MultiEdit" "Glob" "Grep" "Task" "TodoWrite"
+        "WebFetch" "WebSearch" "Bash" "Bash(git *)" "Bash(npm *)"
+        "Bash(bats *)" "Bash(python *)" "Bash(node *)" "NotebookEdit"
+    )
+
+    if [[ -z "$tools_input" ]]; then
+        return 0
+    fi
+
+    local IFS=','
+    read -ra tools <<< "$tools_input"
+
+    for tool in "${tools[@]}"; do
+        tool=$(echo "$tool" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
+        [[ -z "$tool" ]] && continue
+        local valid=false
+        for pattern in "${VALID_TOOL_PATTERNS[@]}"; do
+            if [[ "$tool" == "$pattern" || "$tool" =~ ^Bash\(.+\)$ ]]; then
+                valid=true
+                break
+            fi
+        done
+        if [[ "$valid" == "false" ]]; then
+            echo "Error: Invalid tool: '$tool'" >&2
+            return 1
+        fi
+    done
+    return 0
+}
+
+# Build loop context for Claude Code session
+build_loop_context() {
+    local loop_count=$1
+    local context="Loop #$loop_count. "
+
+    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
+        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
+        context+="Remaining tasks: ${incomplete_tasks:-0}. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
+        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
+        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
+        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
+        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
+    fi
+
+    echo "${context:0:500}"
+}
+
+# Initialize or resume Claude session
+init_claude_session() {
+    local session_file="$RALPH_DIR/.claude_session_id"
+    if [[ -f "$session_file" ]]; then
+        local age_hours=$(get_session_file_age_hours "$session_file")
+        if [[ $age_hours -eq -1 ]] || [[ $age_hours -ge $CLAUDE_SESSION_EXPIRY_HOURS ]]; then
+            rm -f "$session_file"
+            echo ""
+        else
+            cat "$session_file" 2>/dev/null
+        fi
+    else
+        echo ""
+    fi
+}
+
+# Execute provider loop
+provider_execute() {
+    local loop_count=$1
+    local prompt_file=$2
+    local live_mode=$3
+    
+    # Implementation follows the logic from execute_claude_code
+    execute_claude_code "$loop_count" "$prompt_file" "$live_mode"
+}
+
+# Internal helper to execute Claude Code (extracted from ralph_loop.sh)
+execute_claude_code() {
+    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
+    local output_file="$LOG_DIR/claude_output_${timestamp}.log"
+    local loop_count=$1
+    local calls_made=$(cat "$CALL_COUNT_FILE" 2>/dev/null || echo "0")
+    calls_made=$((calls_made + 1))
+
+    # Fix #141: Capture git HEAD SHA at loop start to detect commits as progress
+    local loop_start_sha=""
+    if command -v git &>/dev/null && git rev-parse --git-dir &>/dev/null 2>&1; then
+        loop_start_sha=$(git rev-parse HEAD 2>/dev/null || echo "")
+    fi
+    echo "$loop_start_sha" > "$RALPH_DIR/.loop_start_sha"
+
+    log_status "LOOP" "Executing Claude Code (Call $calls_made/$MAX_CALLS_PER_HOUR)"
+    local timeout_seconds=$((CLAUDE_TIMEOUT_MINUTES * 60))
+    log_status "INFO" "⏳ Starting Claude Code execution... (timeout: ${CLAUDE_TIMEOUT_MINUTES}m)"
+
+    # Build loop context for session continuity
+    local loop_context=""
+    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
+        loop_context=$(build_loop_context "$loop_count")
+        if [[ -n "$loop_context" && "$VERBOSE_PROGRESS" == "true" ]]; then
+            log_status "INFO" "Loop context: $loop_context"
+        fi
+    fi
+
+    # Initialize or resume session
+    local session_id=""
+    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
+        session_id=$(init_claude_session)
+    fi
+
+    # Live mode requires JSON output (stream-json) — override text format
+    if [[ "$LIVE_OUTPUT" == "true" && "$CLAUDE_OUTPUT_FORMAT" == "text" ]]; then
+        log_status "WARN" "Live mode requires JSON output format. Overriding text → json for this session."
+        CLAUDE_OUTPUT_FORMAT="json"
+    fi
+
+    # Build the Claude CLI command with modern flags
+    local use_modern_cli=false
+    if build_claude_command "$PROMPT_FILE" "$loop_context" "$session_id"; then
+        use_modern_cli=true
+        log_status "INFO" "Using modern CLI mode (${CLAUDE_OUTPUT_FORMAT} output)"
+    else
+        log_status "WARN" "Failed to build modern CLI command, falling back to legacy mode"
+        if [[ "$LIVE_OUTPUT" == "true" ]]; then
+            log_status "ERROR" "Live mode requires a built Claude command. Falling back to background mode."
+            LIVE_OUTPUT=false
+        fi
+    fi
+
+    # Execute Claude Code
+    local exit_code=0
+    echo -e "\n\n=== Loop #$loop_count - $(date '+%Y-%m-%d %H:%M:%S') ===" > "$LIVE_LOG_FILE"
+
+    if [[ "$LIVE_OUTPUT" == "true" ]]; then
+        # LIVE MODE implementation (same as in ralph_loop.sh)
+        if ! command -v jq &> /dev/null || ! command -v stdbuf &> /dev/null; then
+            log_status "ERROR" "Live mode dependencies missing. Falling back to background mode."
+            LIVE_OUTPUT=false
+        fi
+    fi
+
+    if [[ "$LIVE_OUTPUT" == "true" ]]; then
+        log_status "INFO" "📺 Live output mode enabled - showing Claude Code streaming..."
+        echo -e "${PURPLE}━━━━━━━━━━━━━━━━ Claude Code Output ━━━━━━━━━━━━━━━━${NC}"
+
+        local -a LIVE_CMD_ARGS=()
+        local skip_next=false
+        for arg in "${CLAUDE_CMD_ARGS[@]}"; do
+            if [[ "$skip_next" == "true" ]]; then
+                LIVE_CMD_ARGS+=("stream-json"); skip_next=false
+            elif [[ "$arg" == "--output-format" ]]; then
+                LIVE_CMD_ARGS+=("$arg"); skip_next=true
+            else
+                LIVE_CMD_ARGS+=("$arg")
+            fi
+        done
+        LIVE_CMD_ARGS+=("--verbose" "--include-partial-messages")
+
+        local jq_filter='if .type == "stream_event" then if .event.type == "content_block_delta" and .event.delta.type == "text_delta" then .event.delta.text elif .event.type == "content_block_start" and .event.content_block.type == "tool_use" then "\n\n⚡ [" + .event.content_block.name + "]\n" elif .event.type == "content_block_stop" then "\n" else empty end else empty end'
+
+        set -o pipefail
+        portable_timeout ${timeout_seconds}s stdbuf -oL "${LIVE_CMD_ARGS[@]}" < /dev/null 2>&1 | stdbuf -oL tee "$output_file" | stdbuf -oL jq --unbuffered -j "$jq_filter" 2>/dev/null | tee "$LIVE_LOG_FILE"
+        local -a pipe_status=("${PIPESTATUS[@]}")
+        set +o pipefail
+        exit_code=${pipe_status[0]}
+        echo ""
+        echo -e "${PURPLE}━━━━━━━━━━━━━━━━ End of Output ━━━━━━━━━━━━━━━━━━━${NC}"
+
+        if [[ "$CLAUDE_USE_CONTINUE" == "true" && -f "$output_file" ]]; then
+            local stream_output_file="${output_file%.log}_stream.log"
+            cp "$output_file" "$stream_output_file"
+            local result_line=$(grep -E '"type"[[:space:]]*:[[:space:]]*"result"' "$output_file" 2>/dev/null | tail -1)
+            if [[ -n "$result_line" ]] && echo "$result_line" | jq -e . >/dev/null 2>&1; then
+                echo "$result_line" > "$output_file"
+            fi
+        fi
+    else
+        # BACKGROUND MODE
+        if [[ "$use_modern_cli" == "true" ]]; then
+            portable_timeout ${timeout_seconds}s "${CLAUDE_CMD_ARGS[@]}" < /dev/null > "$output_file" 2>&1 &
+        else
+            portable_timeout ${timeout_seconds}s $CLAUDE_CODE_CMD < "$PROMPT_FILE" > "$output_file" 2>&1 &
+        fi
+        local claude_pid=$!
+        local progress_counter=0
+        while kill -0 $claude_pid 2>/dev/null; do
+            progress_counter=$((progress_counter + 1))
+            local last_line=""
+            if [[ -f "$output_file" && -s "$output_file" ]]; then
+                last_line=$(tail -1 "$output_file" 2>/dev/null | head -c 80)
+                cp "$output_file" "$LIVE_LOG_FILE" 2>/dev/null
+            fi
+            cat > "$PROGRESS_FILE" << EOF
+{ "status": "executing", "elapsed_seconds": $((progress_counter * 10)), "last_output": "$last_line", "timestamp": "$(date '+%Y-%m-%d %H:%M:%S')" }
+EOF
+            sleep 10
+        done
+        wait $claude_pid
+        exit_code=$?
+    fi
+
+    if [ $exit_code -eq 0 ]; then
+        echo "$calls_made" > "$CALL_COUNT_FILE"
+        echo '{"status": "completed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
+        log_status "SUCCESS" "✅ Claude Code execution completed successfully"
+        [[ "$CLAUDE_USE_CONTINUE" == "true" ]] && save_claude_session "$output_file"
+        log_status "INFO" "🔍 Analyzing Claude Code response..."
+        analyze_response "$output_file" "$loop_count"
+        update_exit_signals
+        log_analysis_summary
+        
+        local files_changed=0
+        local current_sha=""
+        if command -v git &>/dev/null && git rev-parse --git-dir &>/dev/null 2>&1; then
+            current_sha=$(git rev-parse HEAD 2>/dev/null || echo "")
+            if [[ -n "$loop_start_sha" && -n "$current_sha" && "$loop_start_sha" != "$current_sha" ]]; then
+                files_changed=$({ git diff --name-only "$loop_start_sha" "$current_sha"; git diff --name-only HEAD; git diff --name-only --cached; } | sort -u | wc -l)
+            else
+                files_changed=$({ git diff --name-only; git diff --name-only --cached; } | sort -u | wc -l)
+            fi
+        fi
+
+        local has_errors="false"
+        if grep -v '"[^"]*error[^"]*":' "$output_file" 2>/dev/null | grep -qE '(^Error:|^ERROR:|^error:|\]: error|Link: error|Error occurred|failed with error|[Ee]xception|Fatal|FATAL)'; then
+            has_errors="true"
+            log_status "WARN" "Errors detected in output"
+        fi
+        local output_length=$(wc -c < "$output_file" 2>/dev/null || echo 0)
+        record_loop_result "$loop_count" "$files_changed" "$has_errors" "$output_length"
+        [[ $? -ne 0 ]] && return 3
+        return 0
+    else
+        echo '{"status": "failed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
+        if grep -qi "5.*hour.*limit\|limit.*reached.*try.*back\|usage.*limit.*reached" "$output_file"; then
+            log_status "ERROR" "🚫 Claude API 5-hour usage limit reached"
+            return 2
+        else
+            log_status "ERROR" "❌ Claude Code execution failed"
+            return 1
+        fi
+    fi
+}
+
+# Build Claude CLI command with modern flags using array (shell-injection safe)
+build_claude_command() {
+    local prompt_file=$1
+    local loop_context=$2
+    local session_id=$3
+    CLAUDE_CMD_ARGS=("$CLAUDE_CODE_CMD")
+    [[ ! -f "$prompt_file" ]] && return 1
+    [[ "$CLAUDE_OUTPUT_FORMAT" == "json" ]] && CLAUDE_CMD_ARGS+=("--output-format" "json")
+    if [[ -n "$CLAUDE_ALLOWED_TOOLS" ]]; then
+        CLAUDE_CMD_ARGS+=("--allowedTools")
+        local IFS=','
+        read -ra tools_array <<< "$CLAUDE_ALLOWED_TOOLS"
+        for tool in "${tools_array[@]}"; do
+            tool=$(echo "$tool" | xargs); [[ -n "$tool" ]] && CLAUDE_CMD_ARGS+=("$tool")
+        done
+    fi
+    [[ "$CLAUDE_USE_CONTINUE" == "true" && -n "$session_id" ]] && CLAUDE_CMD_ARGS+=("--resume" "$session_id")
+    [[ -n "$loop_context" ]] && CLAUDE_CMD_ARGS+=("--append-system-prompt" "$loop_context")
+    CLAUDE_CMD_ARGS+=("-p" "$(cat "$prompt_file")")
+}
+
+# Save session ID after successful execution
+save_claude_session() {
+    local output_file=$1
+    if [[ -f "$output_file" ]]; then
+        local session_id=$(jq -r '.metadata.session_id // .session_id // empty' "$output_file" 2>/dev/null)
+        [[ -n "$session_id" && "$session_id" != "null" ]] && echo "$session_id" > "$RALPH_DIR/.claude_session_id"
+    fi
+}
+
+# Helper for session age
+get_session_file_age_hours() {
+    local file=$1
+    [[ ! -f "$file" ]] && echo "0" && return
+    local file_mtime
+    if file_mtime=$(stat -c %Y "$file" 2>/dev/null); then :
+    elif file_mtime=$(stat -f %m "$file" 2>/dev/null); then :
+    else file_mtime=$(date -r "$file" +%s 2>/dev/null); fi
+    [[ -z "$file_mtime" || "$file_mtime" == "0" ]] && echo "-1" && return
+    echo "$(( ($(date +%s) - file_mtime) / 3600 ))"
+}
diff --git a/lib/providers/copilot.sh b/lib/providers/copilot.sh
new file mode 100644
index 00000000..23b53b22
--- /dev/null
+++ b/lib/providers/copilot.sh
@@ -0,0 +1,101 @@
+#!/bin/bash
+# GitHub Copilot Provider for Ralph
+# Implements the GitHub Copilot CLI integration
+
+# Provider-specific configuration
+COPILOT_CMD="copilot"
+
+provider_init() {
+    if ! command -v "$COPILOT_CMD" &> /dev/null; then
+        log_status "ERROR" "Copilot CLI not found. Please install 'gh copilot' or 'copilot'."
+        exit 1
+    fi
+    log_status "INFO" "GitHub Copilot provider initialized."
+}
+
+provider_execute() {
+    local loop_count=$1
+    local prompt_file=$2
+    local live_mode=$3
+    
+    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
+    local output_file="$LOG_DIR/copilot_output_${timestamp}.log"
+    local session_file="$RALPH_DIR/.copilot_session_id"
+    
+    local session_arg=""
+    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
+        # Copilot uses --resume [sessionId]
+        # We need to extract the session ID from previous runs if possible
+        # Currently we don't have a reliable way to get sessionId from stdout unless we parse it
+        # For now, we try --resume without ID which resumes "most recent"
+        session_arg="--resume" 
+    fi
+    
+    # Build loop context
+    local loop_context=$(build_loop_context "$loop_count")
+    local prompt_content=$(cat "$prompt_file")
+    local full_prompt="$loop_context
+
+$prompt_content"
+    
+    log_status "INFO" "Executing Copilot CLI..."
+    
+    # Execute Copilot
+    # We use --allow-all-tools to enable agentic behavior
+    # We use --no-ask-user to prevent blocking prompts
+    # We capture stdout/stderr to output_file
+    
+    # Note: We cannot easily stream output in real-time AND capture it cleanly for analysis without named pipes or complex redirection,
+    # but since this is a bash script, we can use the same trick as in ralph_loop.sh if needed.
+    # For now, simplistic execution.
+    
+    $COPILOT_CMD -p "$full_prompt" 
+        $session_arg 
+        --allow-all-tools 
+        --no-ask-user 
+        > "$output_file" 2>&1
+    
+    local exit_code=$?
+    
+    if [ $exit_code -eq 0 ]; then
+        log_status "SUCCESS" "Copilot execution completed."
+        
+        # Analyze response
+        # Copilot output is text, so we rely on text heuristics
+        analyze_response "$output_file" "$loop_count"
+        update_exit_signals
+        return 0
+    else
+        log_status "ERROR" "Copilot execution failed."
+        return 1
+    fi
+}
+
+validate_allowed_tools() {
+    # Copilot manages its own permissions via --allow-tool flags.
+    # We could map ALLOWED_TOOLS to --allow-tool flags here.
+    return 0
+}
+
+# Helper to build loop context
+build_loop_context() {
+    local loop_count=$1
+    local context="Loop #$loop_count. "
+
+    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
+        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
+        context+="Remaining tasks: ${incomplete_tasks:-0}. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
+        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
+        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
+        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
+        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
+    fi
+
+    echo "${context:0:500}"
+}
diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
new file mode 100644
index 00000000..e919b379
--- /dev/null
+++ b/lib/providers/gemini.sh
@@ -0,0 +1,86 @@
+#!/bin/bash
+# Gemini Provider for Ralph
+# Implements the Gemini CLI integration (Native Agent Mode)
+
+# Provider-specific configuration
+GEMINI_CMD="gemini"
+
+provider_init() {
+    if ! command -v "$GEMINI_CMD" &> /dev/null; then
+        log_status "ERROR" "Gemini CLI not found. Please install 'gemini'."
+        exit 1
+    fi
+    log_status "INFO" "Gemini CLI provider initialized."
+}
+
+provider_execute() {
+    local loop_count=$1
+    local prompt_file=$2
+    local live_mode=$3
+    
+    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
+    local output_file="$LOG_DIR/gemini_output_${timestamp}.log"
+    
+    local session_arg=""
+    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
+        # Gemini uses --resume latest or session ID
+        session_arg="--resume latest" 
+    fi
+    
+    # Build loop context
+    local loop_context=$(build_loop_context "$loop_count")
+    local prompt_content=$(cat "$prompt_file")
+    local full_prompt="$loop_context\n\n$prompt_content"
+    
+    log_status "INFO" "Executing Gemini CLI (Agent Mode)..."
+    
+    # Execute Gemini
+    # We use --yolo to enable autonomous agent behavior (auto-approve tools)
+    # We use -p for non-interactive prompt
+    
+    $GEMINI_CMD -p "$full_prompt" \
+        $session_arg \
+        --yolo \
+        --output-format text \
+        > "$output_file" 2>&1
+    
+    local exit_code=$?
+    
+    if [ $exit_code -eq 0 ]; then
+        log_status "SUCCESS" "Gemini execution completed."
+        analyze_response "$output_file" "$loop_count"
+        update_exit_signals
+        return 0
+    else
+        log_status "ERROR" "Gemini execution failed."
+        return 1
+    fi
+}
+
+validate_allowed_tools() {
+    # Gemini manages its own tools
+    return 0
+}
+
+# Helper to build loop context
+build_loop_context() {
+    local loop_count=$1
+    local context="Loop #$loop_count. "
+
+    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
+        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
+        context+="Remaining tasks: ${incomplete_tasks:-0}. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
+        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
+        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
+        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
+        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
+    fi
+
+    echo "${context:0:500}"
+}
diff --git a/lib/session_manager.sh b/lib/session_manager.sh
new file mode 100644
index 00000000..abc900c0
--- /dev/null
+++ b/lib/session_manager.sh
@@ -0,0 +1,116 @@
+#!/bin/bash
+# Session Management Component for Ralph
+
+# Session file location
+RALPH_SESSION_FILE="$RALPH_DIR/.ralph_session"
+RALPH_SESSION_HISTORY_FILE="$RALPH_DIR/.ralph_session_history"
+CLAUDE_SESSION_FILE="$RALPH_DIR/.claude_session_id"
+
+# Get current session ID from Ralph session file
+get_session_id() {
+    if [[ ! -f "$RALPH_SESSION_FILE" ]]; then
+        echo ""
+        return 0
+    fi
+    local session_id
+    session_id=$(jq -r '.session_id // ""' "$RALPH_SESSION_FILE" 2>/dev/null)
+    [[ -z "$session_id" || "$session_id" == "null" ]] && session_id=""
+    echo "$session_id"
+    return 0
+}
+
+# Reset session with reason logging
+reset_session() {
+    local reason=${1:-"manual_reset"}
+    local reset_timestamp=$(get_iso_timestamp)
+
+    jq -n \
+        --arg session_id "" \
+        --arg created_at "" \
+        --arg last_used "" \
+        --arg reset_at "$reset_timestamp" \
+        --arg reset_reason "$reason" \
+        '{
+            session_id: $session_id,
+            created_at: $created_at,
+            last_used: $last_used,
+            reset_at: $reset_at,
+            reset_reason: $reset_reason
+        }' > "$RALPH_SESSION_FILE"
+
+    rm -f "$CLAUDE_SESSION_FILE" 2>/dev/null
+
+    if [[ -f "$RALPH_DIR/.exit_signals" ]]; then
+        echo '{"test_only_loops": [], "done_signals": [], "completion_indicators": []}' > "$RALPH_DIR/.exit_signals"
+    fi
+    rm -f "$RALPH_DIR/.response_analysis" 2>/dev/null
+
+    log_session_transition "active" "reset" "$reason" "${loop_count:-0}" || true
+    log_status "INFO" "Session reset: $reason"
+}
+
+# Log session state transitions
+log_session_transition() {
+    local from_state=$1
+    local to_state=$2
+    local reason=$3
+    local loop_number=${4:-0}
+    local ts=$(get_iso_timestamp)
+
+    local transition=$(jq -n -c \
+        --arg timestamp "$ts" \
+        --arg from_state "$from_state" \
+        --arg to_state "$to_state" \
+        --arg reason "$reason" \
+        --argjson loop_number "$loop_number" \
+        '{
+            timestamp: $timestamp,
+            from_state: $from_state,
+            to_state: $to_state,
+            reason: $reason,
+            loop_number: $loop_number
+        }')
+
+    local history='[]'
+    if [[ -f "$RALPH_SESSION_HISTORY_FILE" ]]; then
+        history=$(cat "$RALPH_SESSION_HISTORY_FILE" 2>/dev/null)
+        jq empty <<<"$history" 2>/dev/null || history='[]'
+    fi
+
+    echo "$history" | jq ". += [$transition] | .[-50:]" > "$RALPH_SESSION_HISTORY_FILE"
+}
+
+# Generate a unique session ID
+generate_session_id() {
+    echo "ralph-$(date +%s)-$RANDOM"
+}
+
+# Initialize session tracking
+init_session_tracking() {
+    local ts=$(get_iso_timestamp)
+    if [[ ! -f "$RALPH_SESSION_FILE" ]]; then
+        local new_sid=$(generate_session_id)
+        jq -n \
+            --arg session_id "$new_sid" \
+            --arg created_at "$ts" \
+            --arg last_used "$ts" \
+            --arg reset_at "" \
+            --arg reset_reason "" \
+            '{
+                session_id: $session_id,
+                created_at: $created_at,
+                last_used: $last_used,
+                reset_at: $reset_at,
+                reset_reason: $reset_reason
+            }' > "$RALPH_SESSION_FILE"
+        log_status "INFO" "Initialized session tracking (session: $new_sid)"
+    fi
+}
+
+# Update last_used timestamp
+update_session_last_used() {
+    [[ ! -f "$RALPH_SESSION_FILE" ]] && return 0
+    local ts=$(get_iso_timestamp)
+    local updated=$(jq --arg last_used "$ts" '.last_used = $last_used' "$RALPH_SESSION_FILE" 2>/dev/null)
+    [[ -n "$updated" ]] && echo "$updated" > "$RALPH_SESSION_FILE"
+}
\ No newline at end of file
diff --git a/lib/tool_executor.sh b/lib/tool_executor.sh
new file mode 100644
index 00000000..98690b1d
--- /dev/null
+++ b/lib/tool_executor.sh
@@ -0,0 +1,95 @@
+#!/bin/bash
+# Tool Executor Component for Ralph - Specific Parsing
+# Handles extraction and execution of tool calls from LLM output
+
+# Execute a tool call
+execute_tool() {
+    local tool_name="$1"
+    local content="$2"
+
+    log_status "INFO" "🛠 Executing tool: $tool_name"
+    
+    case "$tool_name" in
+        "read_file")
+            local path=$(echo "$content" | perl -0777 -ne 'print $1 if /<arg name="path">(.*?)<\/arg>/s')
+            if [[ -f "$path" ]]; then
+                echo "--- TOOL RESULT ($tool_name) ---"
+                cat "$path"
+                echo "-------------------------------"
+            else
+                echo "Error: File not found: $path"
+            fi
+            ;;
+        "write_file")
+            local path=$(echo "$content" | perl -0777 -ne 'print $1 if /<arg name="path">(.*?)<\/arg>/s')
+            local file_content=$(echo "$content" | perl -0777 -ne 'print $1 if /<arg name="content">(.*?)<\/arg>/s')
+            
+            if [[ -n "$path" ]]; then
+                mkdir -p "$(dirname "$path")"
+                echo "$file_content" > "$path"
+                echo "--- TOOL RESULT ($tool_name) ---"
+                echo "Successfully wrote to $path"
+                echo "-------------------------------"
+            else
+                echo "Error: Missing path for write_file"
+            fi
+            ;;
+        "run_command")
+            local cmd=$(echo "$content" | perl -0777 -ne 'print $1 if /<arg name="command">(.*?)<\/arg>/s')
+            if [[ -n "$cmd" ]]; then
+                if [[ "$cmd" == *"rm -rf /"* ]]; then
+                    echo "Error: Dangerous command blocked"
+                else
+                    echo "--- TOOL RESULT ($tool_name) ---"
+                    eval "$cmd" 2>&1
+                    echo "-------------------------------"
+                fi
+            else
+                echo "Error: Missing command for run_command"
+            fi
+            ;;
+        "list_files")
+            local dir=$(echo "$content" | perl -0777 -ne 'print $1 if /<arg name="directory">(.*?)<\/arg>/s')
+            dir=${dir:-"."}
+            echo "--- TOOL RESULT ($tool_name) ---"
+            ls -R "$dir"
+            echo "-------------------------------"
+            ;;
+        *)
+            echo "Error: Unknown tool: $tool_name"
+            ;;
+    esac
+}
+
+# Process AI response for tool calls
+run_tools_if_requested() {
+    local input_file="$1"
+    local results_file=$(mktemp)
+    
+    local found_tools=false
+    local temp_blocks_dir=$(mktemp -d)
+    
+    # Use perl to extract each tool_call block
+    perl -0777 -ne 'my $i=0; while (/<tool_call(.*?)<\/tool_call>/sg) { open my $fh, ">", "'$temp_blocks_dir'/block_$i.txt"; print $fh "<tool_call$1</tool_call>"; close $fh; $i++; }' "$input_file"
+    
+    for block_file in "$temp_blocks_dir"/block_*.txt; do
+        if [[ -f "$block_file" ]]; then
+            found_tools=true
+            local block_content=$(cat "$block_file")
+            # Extract tool name from the first line of the block
+            local tool_name=$(echo "$block_content" | head -n 1 | sed -n 's/.*<tool_call name="\([^"]*\)".*/\1/p')
+            execute_tool "$tool_name" "$block_content" >> "$results_file"
+        fi
+    done
+    
+    rm -rf "$temp_blocks_dir"
+    
+    if [[ "$found_tools" == "true" ]]; then
+        cat "$results_file"
+        rm "$results_file"
+        return 0
+    else
+        rm "$results_file"
+        return 1
+    fi
+}
\ No newline at end of file
diff --git a/ralph_enable.sh b/ralph_enable.sh
index 3f412cd5..4f3a817b 100755
--- a/ralph_enable.sh
+++ b/ralph_enable.sh
@@ -336,11 +336,55 @@ phase_task_source_selection() {
 }
 
 # =============================================================================
-# PHASE 3: CONFIGURATION
+# PHASE 3: AI PROVIDER SELECTION
+# =============================================================================
+
+phase_provider_selection() {
+    print_header "AI Provider Selection" "Phase 3 of 6"
+
+    # Default provider
+    CONFIG_PROVIDER="claude"
+
+    if [[ "$NON_INTERACTIVE" == "true" ]]; then
+        echo "Using default provider: $CONFIG_PROVIDER"
+        return 0
+    fi
+
+    echo "Select the AI provider to use:"
+    echo ""
+
+    local options=("Claude Code (Anthropic)" "Google Gemini" "GitHub Copilot (Coming Soon)")
+    local selection
+    selection=$(select_option "Select provider" "${options[@]}")
+
+    case "$selection" in
+        "Claude Code (Anthropic)")
+            CONFIG_PROVIDER="claude"
+            ;;
+        "Google Gemini")
+            CONFIG_PROVIDER="gemini"
+            if [[ -z "$GEMINI_API_KEY" ]]; then
+                echo ""
+                print_warning "GEMINI_API_KEY is not set in your environment."
+                echo "Please ensure it is set before running Ralph."
+            fi
+            ;;
+        "GitHub Copilot (Coming Soon)")
+            CONFIG_PROVIDER="copilot"
+            print_warning "Copilot support is experimental."
+            ;;
+    esac
+
+    echo ""
+    echo "Selected provider: $CONFIG_PROVIDER"
+}
+
+# =============================================================================
+# PHASE 4: CONFIGURATION
 # =============================================================================
 
 phase_configuration() {
-    print_header "Configuration" "Phase 3 of 5"
+    print_header "Configuration" "Phase 4 of 6"
 
     # Project name
     if [[ "$NON_INTERACTIVE" != "true" ]]; then
@@ -385,16 +429,17 @@ phase_configuration() {
     print_summary "Configuration" \
         "Project=$CONFIG_PROJECT_NAME" \
         "Type=$DETECTED_PROJECT_TYPE" \
+        "Provider=$CONFIG_PROVIDER" \
         "Max calls/hour=$CONFIG_MAX_CALLS" \
         "Task sources=${SELECTED_SOURCES:-none}"
 }
 
 # =============================================================================
-# PHASE 4: FILE GENERATION
+# PHASE 5: FILE GENERATION
 # =============================================================================
 
 phase_file_generation() {
-    print_header "File Generation" "Phase 4 of 5"
+    print_header "File Generation" "Phase 5 of 6"
 
     # Import tasks if sources selected
     local imported_tasks=""
@@ -438,6 +483,7 @@ phase_file_generation() {
     export ENABLE_SKIP_TASKS="$SKIP_TASKS"
     export ENABLE_PROJECT_NAME="$CONFIG_PROJECT_NAME"
     export ENABLE_TASK_CONTENT="$imported_tasks"
+    export ENABLE_PROVIDER="$CONFIG_PROVIDER"
 
     # Run core enable logic
     echo "Creating Ralph configuration..."
diff --git a/ralph_loop.sh b/ralph_loop.sh
index 683d6543..a4a844d3 100755
--- a/ralph_loop.sh
+++ b/ralph_loop.sh
@@ -16,10 +16,12 @@ source "$SCRIPT_DIR/lib/date_utils.sh"
 source "$SCRIPT_DIR/lib/timeout_utils.sh"
 source "$SCRIPT_DIR/lib/response_analyzer.sh"
 source "$SCRIPT_DIR/lib/circuit_breaker.sh"
+source "$SCRIPT_DIR/lib/providers/base.sh"
 
 # Configuration
 # Ralph-specific files live in .ralph/ subfolder
 RALPH_DIR=".ralph"
+source "$SCRIPT_DIR/lib/session_manager.sh"
 PROMPT_FILE="$RALPH_DIR/PROMPT.md"
 LOG_DIR="$RALPH_DIR/logs"
 DOCS_DIR="$RALPH_DIR/docs/generated"
@@ -520,896 +522,10 @@ should_exit_gracefully() {
 }
 
 # =============================================================================
-# MODERN CLI HELPER FUNCTIONS (Phase 1.1)
+# PROVIDER-SPECIFIC LOGIC (Moved to lib/providers/)
 # =============================================================================
 
-# Check Claude CLI version for compatibility with modern flags
-check_claude_version() {
-    local version=$($CLAUDE_CODE_CMD --version 2>/dev/null | grep -oE '[0-9]+\.[0-9]+\.[0-9]+' | head -1)
-
-    if [[ -z "$version" ]]; then
-        log_status "WARN" "Cannot detect Claude CLI version, assuming compatible"
-        return 0
-    fi
-
-    # Compare versions (simplified semver comparison)
-    local required="$CLAUDE_MIN_VERSION"
-
-    # Convert to comparable integers (major * 10000 + minor * 100 + patch)
-    local ver_parts=(${version//./ })
-    local req_parts=(${required//./ })
-
-    local ver_num=$((${ver_parts[0]:-0} * 10000 + ${ver_parts[1]:-0} * 100 + ${ver_parts[2]:-0}))
-    local req_num=$((${req_parts[0]:-0} * 10000 + ${req_parts[1]:-0} * 100 + ${req_parts[2]:-0}))
-
-    if [[ $ver_num -lt $req_num ]]; then
-        log_status "WARN" "Claude CLI version $version < $required. Some modern features may not work."
-        log_status "WARN" "Consider upgrading: npm update -g @anthropic-ai/claude-code"
-        return 1
-    fi
-
-    log_status "INFO" "Claude CLI version $version (>= $required) - modern features enabled"
-    return 0
-}
-
-# Validate allowed tools against whitelist
-# Returns 0 if valid, 1 if invalid with error message
-validate_allowed_tools() {
-    local tools_input=$1
-
-    if [[ -z "$tools_input" ]]; then
-        return 0  # Empty is valid (uses defaults)
-    fi
-
-    # Split by comma
-    local IFS=','
-    read -ra tools <<< "$tools_input"
-
-    for tool in "${tools[@]}"; do
-        # Trim whitespace
-        tool=$(echo "$tool" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
-
-        if [[ -z "$tool" ]]; then
-            continue
-        fi
-
-        local valid=false
-
-        # Check against valid patterns
-        for pattern in "${VALID_TOOL_PATTERNS[@]}"; do
-            if [[ "$tool" == "$pattern" ]]; then
-                valid=true
-                break
-            fi
-
-            # Check for Bash(*) pattern - any Bash with parentheses is allowed
-            if [[ "$tool" =~ ^Bash\(.+\)$ ]]; then
-                valid=true
-                break
-            fi
-        done
-
-        if [[ "$valid" == "false" ]]; then
-            echo "Error: Invalid tool in --allowed-tools: '$tool'"
-            echo "Valid tools: ${VALID_TOOL_PATTERNS[*]}"
-            echo "Note: Bash(...) patterns with any content are allowed (e.g., 'Bash(git *)')"
-            return 1
-        fi
-    done
-
-    return 0
-}
-
-# Build loop context for Claude Code session
-# Provides loop-specific context via --append-system-prompt
-build_loop_context() {
-    local loop_count=$1
-    local context=""
-
-    # Add loop number
-    context="Loop #${loop_count}. "
-
-    # Extract incomplete tasks from fix_plan.md
-    # Bug #3 Fix: Support indented markdown checkboxes with [[:space:]]* pattern
-    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
-        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
-        [[ -z "$incomplete_tasks" ]] && incomplete_tasks=0
-        context+="Remaining tasks: ${incomplete_tasks}. "
-    fi
-
-    # Add circuit breaker state
-    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
-        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
-        if [[ "$cb_state" != "CLOSED" && "$cb_state" != "null" && -n "$cb_state" ]]; then
-            context+="Circuit breaker: ${cb_state}. "
-        fi
-    fi
-
-    # Add previous loop summary (truncated)
-    if [[ -f "$RESPONSE_ANALYSIS_FILE" ]]; then
-        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RESPONSE_ANALYSIS_FILE" 2>/dev/null | head -c 200)
-        if [[ -n "$prev_summary" && "$prev_summary" != "null" ]]; then
-            context+="Previous: ${prev_summary}"
-        fi
-    fi
-
-    # Limit total length to ~500 chars
-    echo "${context:0:500}"
-}
-
-# Get session file age in hours (cross-platform)
-# Returns: age in hours on stdout, or -1 if stat fails
-# Note: Returns 0 for files less than 1 hour old
-get_session_file_age_hours() {
-    local file=$1
-
-    if [[ ! -f "$file" ]]; then
-        echo "0"
-        return
-    fi
-
-    # Get file modification time using capability detection
-    # Handles macOS with Homebrew coreutils where stat flags differ
-    local file_mtime
-
-    # Try GNU stat first (Linux, macOS with Homebrew coreutils)
-    if file_mtime=$(stat -c %Y "$file" 2>/dev/null) && [[ -n "$file_mtime" && "$file_mtime" =~ ^[0-9]+$ ]]; then
-        : # success
-    # Try BSD stat (native macOS)
-    elif file_mtime=$(stat -f %m "$file" 2>/dev/null) && [[ -n "$file_mtime" && "$file_mtime" =~ ^[0-9]+$ ]]; then
-        : # success
-    # Fallback to date -r (most portable)
-    elif file_mtime=$(date -r "$file" +%s 2>/dev/null) && [[ -n "$file_mtime" && "$file_mtime" =~ ^[0-9]+$ ]]; then
-        : # success
-    else
-        file_mtime=""
-    fi
-
-    # Handle stat failure - return -1 to indicate error
-    # This prevents false expiration when stat fails
-    if [[ -z "$file_mtime" || "$file_mtime" == "0" ]]; then
-        echo "-1"
-        return
-    fi
-
-    local current_time
-    current_time=$(date +%s)
-
-    local age_seconds=$((current_time - file_mtime))
-    local age_hours=$((age_seconds / 3600))
-
-    echo "$age_hours"
-}
-
-# Initialize or resume Claude session (with expiration check)
-#
-# Session Expiration Strategy:
-# - Default expiration: 24 hours (configurable via CLAUDE_SESSION_EXPIRY_HOURS)
-# - 24 hours chosen because: long enough for multi-day projects, short enough
-#   to prevent stale context from causing unpredictable behavior
-# - Sessions auto-expire to ensure Claude starts fresh periodically
-#
-# Returns (stdout):
-#   - Session ID string: when resuming a valid, non-expired session
-#   - Empty string: when starting new session (no file, expired, or stat error)
-#
-# Return codes:
-#   - 0: Always returns success (caller should check stdout for session ID)
-#
-init_claude_session() {
-    if [[ -f "$CLAUDE_SESSION_FILE" ]]; then
-        # Check session age
-        local age_hours
-        age_hours=$(get_session_file_age_hours "$CLAUDE_SESSION_FILE")
-
-        # Handle stat failure (-1) - treat as needing new session
-        # Don't expire sessions when we can't determine age
-        if [[ $age_hours -eq -1 ]]; then
-            log_status "WARN" "Could not determine session age, starting new session"
-            rm -f "$CLAUDE_SESSION_FILE"
-            echo ""
-            return 0
-        fi
-
-        # Check if session has expired
-        if [[ $age_hours -ge $CLAUDE_SESSION_EXPIRY_HOURS ]]; then
-            log_status "INFO" "Session expired (${age_hours}h old, max ${CLAUDE_SESSION_EXPIRY_HOURS}h), starting new session"
-            rm -f "$CLAUDE_SESSION_FILE"
-            echo ""
-            return 0
-        fi
-
-        # Session is valid, try to read it
-        local session_id=$(cat "$CLAUDE_SESSION_FILE" 2>/dev/null)
-        if [[ -n "$session_id" ]]; then
-            log_status "INFO" "Resuming Claude session: ${session_id:0:20}... (${age_hours}h old)"
-            echo "$session_id"
-            return 0
-        fi
-    fi
-
-    log_status "INFO" "Starting new Claude session"
-    echo ""
-}
-
-# Save session ID after successful execution
-save_claude_session() {
-    local output_file=$1
-
-    # Try to extract session ID from JSON output
-    if [[ -f "$output_file" ]]; then
-        local session_id=$(jq -r '.metadata.session_id // .session_id // empty' "$output_file" 2>/dev/null)
-        if [[ -n "$session_id" && "$session_id" != "null" ]]; then
-            echo "$session_id" > "$CLAUDE_SESSION_FILE"
-            log_status "INFO" "Saved Claude session: ${session_id:0:20}..."
-        fi
-    fi
-}
-
-# =============================================================================
-# SESSION LIFECYCLE MANAGEMENT FUNCTIONS (Phase 1.2)
-# =============================================================================
-
-# Get current session ID from Ralph session file
-# Returns: session ID string or empty if not found
-get_session_id() {
-    if [[ ! -f "$RALPH_SESSION_FILE" ]]; then
-        echo ""
-        return 0
-    fi
-
-    # Extract session_id from JSON file (SC2155: separate declare from assign)
-    local session_id
-    session_id=$(jq -r '.session_id // ""' "$RALPH_SESSION_FILE" 2>/dev/null)
-    local jq_status=$?
-
-    # Handle jq failure or null/empty results
-    if [[ $jq_status -ne 0 || -z "$session_id" || "$session_id" == "null" ]]; then
-        session_id=""
-    fi
-    echo "$session_id"
-    return 0
-}
-
-# Reset session with reason logging
-# Usage: reset_session "reason_for_reset"
-reset_session() {
-    local reason=${1:-"manual_reset"}
-
-    # Get current timestamp
-    local reset_timestamp
-    reset_timestamp=$(get_iso_timestamp)
-
-    # Always create/overwrite the session file using jq for safe JSON escaping
-    jq -n \
-        --arg session_id "" \
-        --arg created_at "" \
-        --arg last_used "" \
-        --arg reset_at "$reset_timestamp" \
-        --arg reset_reason "$reason" \
-        '{
-            session_id: $session_id,
-            created_at: $created_at,
-            last_used: $last_used,
-            reset_at: $reset_at,
-            reset_reason: $reset_reason
-        }' > "$RALPH_SESSION_FILE"
-
-    # Also clear the Claude session file for consistency
-    rm -f "$CLAUDE_SESSION_FILE" 2>/dev/null
-
-    # Clear exit signals to prevent stale completion indicators from causing premature exit (issue #91)
-    # This ensures a fresh start without leftover state from previous sessions
-    if [[ -f "$EXIT_SIGNALS_FILE" ]]; then
-        echo '{"test_only_loops": [], "done_signals": [], "completion_indicators": []}' > "$EXIT_SIGNALS_FILE"
-        [[ "${VERBOSE_PROGRESS:-}" == "true" ]] && log_status "INFO" "Cleared exit signals file"
-    fi
-
-    # Clear response analysis to prevent stale EXIT_SIGNAL from previous session
-    rm -f "$RESPONSE_ANALYSIS_FILE" 2>/dev/null
-
-    # Log the session transition (non-fatal to prevent script exit under set -e)
-    log_session_transition "active" "reset" "$reason" "${loop_count:-0}" || true
-
-    log_status "INFO" "Session reset: $reason"
-}
-
-# Log session state transitions to history file
-# Usage: log_session_transition from_state to_state reason loop_number
-log_session_transition() {
-    local from_state=$1
-    local to_state=$2
-    local reason=$3
-    local loop_number=${4:-0}
-
-    # Get timestamp once (SC2155: separate declare from assign)
-    local ts
-    ts=$(get_iso_timestamp)
-
-    # Create transition entry using jq for safe JSON (SC2155: separate declare from assign)
-    local transition
-    transition=$(jq -n -c \
-        --arg timestamp "$ts" \
-        --arg from_state "$from_state" \
-        --arg to_state "$to_state" \
-        --arg reason "$reason" \
-        --argjson loop_number "$loop_number" \
-        '{
-            timestamp: $timestamp,
-            from_state: $from_state,
-            to_state: $to_state,
-            reason: $reason,
-            loop_number: $loop_number
-        }')
-
-    # Read history file defensively - fallback to empty array on any failure
-    local history
-    if [[ -f "$RALPH_SESSION_HISTORY_FILE" ]]; then
-        history=$(cat "$RALPH_SESSION_HISTORY_FILE" 2>/dev/null)
-        # Validate JSON, fallback to empty array if corrupted
-        if ! echo "$history" | jq empty 2>/dev/null; then
-            history='[]'
-        fi
-    else
-        history='[]'
-    fi
-
-    # Append transition and keep only last 50 entries
-    local updated_history
-    updated_history=$(echo "$history" | jq ". += [$transition] | .[-50:]" 2>/dev/null)
-    local jq_status=$?
-
-    # Only write if jq succeeded
-    if [[ $jq_status -eq 0 && -n "$updated_history" ]]; then
-        echo "$updated_history" > "$RALPH_SESSION_HISTORY_FILE"
-    else
-        # Fallback: start fresh with just this transition
-        echo "[$transition]" > "$RALPH_SESSION_HISTORY_FILE"
-    fi
-}
-
-# Generate a unique session ID using timestamp and random component
-generate_session_id() {
-    local ts
-    ts=$(date +%s)
-    local rand
-    rand=$RANDOM
-    echo "ralph-${ts}-${rand}"
-}
-
-# Initialize session tracking (called at loop start)
-init_session_tracking() {
-    local ts
-    ts=$(get_iso_timestamp)
-
-    # Create session file if it doesn't exist
-    if [[ ! -f "$RALPH_SESSION_FILE" ]]; then
-        local new_session_id
-        new_session_id=$(generate_session_id)
-
-        jq -n \
-            --arg session_id "$new_session_id" \
-            --arg created_at "$ts" \
-            --arg last_used "$ts" \
-            --arg reset_at "" \
-            --arg reset_reason "" \
-            '{
-                session_id: $session_id,
-                created_at: $created_at,
-                last_used: $last_used,
-                reset_at: $reset_at,
-                reset_reason: $reset_reason
-            }' > "$RALPH_SESSION_FILE"
-
-        log_status "INFO" "Initialized session tracking (session: $new_session_id)"
-        return 0
-    fi
-
-    # Validate existing session file
-    if ! jq empty "$RALPH_SESSION_FILE" 2>/dev/null; then
-        log_status "WARN" "Corrupted session file detected, recreating..."
-        local new_session_id
-        new_session_id=$(generate_session_id)
-
-        jq -n \
-            --arg session_id "$new_session_id" \
-            --arg created_at "$ts" \
-            --arg last_used "$ts" \
-            --arg reset_at "$ts" \
-            --arg reset_reason "corrupted_file_recovery" \
-            '{
-                session_id: $session_id,
-                created_at: $created_at,
-                last_used: $last_used,
-                reset_at: $reset_at,
-                reset_reason: $reset_reason
-            }' > "$RALPH_SESSION_FILE"
-    fi
-}
-
-# Update last_used timestamp in session file (called on each loop iteration)
-update_session_last_used() {
-    if [[ ! -f "$RALPH_SESSION_FILE" ]]; then
-        return 0
-    fi
-
-    local ts
-    ts=$(get_iso_timestamp)
-
-    # Update last_used in existing session file
-    local updated
-    updated=$(jq --arg last_used "$ts" '.last_used = $last_used' "$RALPH_SESSION_FILE" 2>/dev/null)
-    local jq_status=$?
-
-    if [[ $jq_status -eq 0 && -n "$updated" ]]; then
-        echo "$updated" > "$RALPH_SESSION_FILE"
-    fi
-}
-
-# Global array for Claude command arguments (avoids shell injection)
-declare -a CLAUDE_CMD_ARGS=()
-
-# Build Claude CLI command with modern flags using array (shell-injection safe)
-# Populates global CLAUDE_CMD_ARGS array for direct execution
-# Uses -p flag with prompt content (Claude CLI does not have --prompt-file)
-build_claude_command() {
-    local prompt_file=$1
-    local loop_context=$2
-    local session_id=$3
-
-    # Reset global array
-    # Note: We do NOT use --dangerously-skip-permissions here. Tool permissions
-    # are controlled via --allowedTools from CLAUDE_ALLOWED_TOOLS in .ralphrc.
-    # This preserves the permission denial circuit breaker (Issue #101).
-    CLAUDE_CMD_ARGS=("$CLAUDE_CODE_CMD")
-
-    # Check if prompt file exists
-    if [[ ! -f "$prompt_file" ]]; then
-        log_status "ERROR" "Prompt file not found: $prompt_file"
-        return 1
-    fi
-
-    # Add output format flag
-    if [[ "$CLAUDE_OUTPUT_FORMAT" == "json" ]]; then
-        CLAUDE_CMD_ARGS+=("--output-format" "json")
-    fi
-
-    # Add allowed tools (each tool as separate array element)
-    if [[ -n "$CLAUDE_ALLOWED_TOOLS" ]]; then
-        CLAUDE_CMD_ARGS+=("--allowedTools")
-        # Split by comma and add each tool
-        local IFS=','
-        read -ra tools_array <<< "$CLAUDE_ALLOWED_TOOLS"
-        for tool in "${tools_array[@]}"; do
-            # Trim whitespace
-            tool=$(echo "$tool" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
-            if [[ -n "$tool" ]]; then
-                CLAUDE_CMD_ARGS+=("$tool")
-            fi
-        done
-    fi
-
-    # Add session continuity flag
-    # IMPORTANT: Use --resume with explicit session ID instead of --continue
-    # --continue resumes the "most recent session in current directory" which
-    # can hijack active Claude Code sessions. --resume with a specific session ID
-    # ensures we only resume Ralph's own sessions. (Issue #151)
-    if [[ "$CLAUDE_USE_CONTINUE" == "true" && -n "$session_id" ]]; then
-        CLAUDE_CMD_ARGS+=("--resume" "$session_id")
-    fi
-    # If no session_id, start fresh - Claude will generate a new session ID
-    # which we'll capture via save_claude_session() for future loops
-
-    # Add loop context as system prompt (no escaping needed - array handles it)
-    if [[ -n "$loop_context" ]]; then
-        CLAUDE_CMD_ARGS+=("--append-system-prompt" "$loop_context")
-    fi
-
-    # Read prompt file content and use -p flag
-    # Note: Claude CLI uses -p for prompts, not --prompt-file (which doesn't exist)
-    # Array-based approach maintains shell injection safety
-    local prompt_content
-    prompt_content=$(cat "$prompt_file")
-    CLAUDE_CMD_ARGS+=("-p" "$prompt_content")
-}
-
-# Main execution function
-execute_claude_code() {
-    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
-    local output_file="$LOG_DIR/claude_output_${timestamp}.log"
-    local loop_count=$1
-    local calls_made=$(cat "$CALL_COUNT_FILE" 2>/dev/null || echo "0")
-    calls_made=$((calls_made + 1))
-
-    # Fix #141: Capture git HEAD SHA at loop start to detect commits as progress
-    # Store in file for access by progress detection after Claude execution
-    local loop_start_sha=""
-    if command -v git &>/dev/null && git rev-parse --git-dir &>/dev/null 2>&1; then
-        loop_start_sha=$(git rev-parse HEAD 2>/dev/null || echo "")
-    fi
-    echo "$loop_start_sha" > "$RALPH_DIR/.loop_start_sha"
-
-    log_status "LOOP" "Executing Claude Code (Call $calls_made/$MAX_CALLS_PER_HOUR)"
-    local timeout_seconds=$((CLAUDE_TIMEOUT_MINUTES * 60))
-    log_status "INFO" "⏳ Starting Claude Code execution... (timeout: ${CLAUDE_TIMEOUT_MINUTES}m)"
-
-    # Build loop context for session continuity
-    local loop_context=""
-    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
-        loop_context=$(build_loop_context "$loop_count")
-        if [[ -n "$loop_context" && "$VERBOSE_PROGRESS" == "true" ]]; then
-            log_status "INFO" "Loop context: $loop_context"
-        fi
-    fi
-
-    # Initialize or resume session
-    local session_id=""
-    if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
-        session_id=$(init_claude_session)
-    fi
-
-    # Live mode requires JSON output (stream-json) — override text format
-    if [[ "$LIVE_OUTPUT" == "true" && "$CLAUDE_OUTPUT_FORMAT" == "text" ]]; then
-        log_status "WARN" "Live mode requires JSON output format. Overriding text → json for this session."
-        CLAUDE_OUTPUT_FORMAT="json"
-    fi
-
-    # Build the Claude CLI command with modern flags
-    local use_modern_cli=false
-
-    if build_claude_command "$PROMPT_FILE" "$loop_context" "$session_id"; then
-        use_modern_cli=true
-        log_status "INFO" "Using modern CLI mode (${CLAUDE_OUTPUT_FORMAT} output)"
-    else
-        log_status "WARN" "Failed to build modern CLI command, falling back to legacy mode"
-        if [[ "$LIVE_OUTPUT" == "true" ]]; then
-            log_status "ERROR" "Live mode requires a built Claude command. Falling back to background mode."
-            LIVE_OUTPUT=false
-        fi
-    fi
-
-    # Execute Claude Code
-    local exit_code=0
-
-    # Initialize live.log for this execution
-    echo -e "\n\n=== Loop #$loop_count - $(date '+%Y-%m-%d %H:%M:%S') ===" > "$LIVE_LOG_FILE"
-
-    if [[ "$LIVE_OUTPUT" == "true" ]]; then
-        # LIVE MODE: Show streaming output in real-time using stream-json + jq
-        # Based on: https://www.ytyng.com/en/blog/claude-stream-json-jq/
-        #
-        # Uses CLAUDE_CMD_ARGS from build_claude_command() to preserve:
-        # - --allowedTools (tool permissions)
-        # - --append-system-prompt (loop context)
-        # - --continue (session continuity)
-        # - -p (prompt content)
-
-        # Check dependencies for live mode
-        if ! command -v jq &> /dev/null; then
-            log_status "ERROR" "Live mode requires 'jq' but it's not installed. Falling back to background mode."
-            LIVE_OUTPUT=false
-        elif ! command -v stdbuf &> /dev/null; then
-            log_status "ERROR" "Live mode requires 'stdbuf' (from coreutils) but it's not installed. Falling back to background mode."
-            LIVE_OUTPUT=false
-        fi
-    fi
-
-    if [[ "$LIVE_OUTPUT" == "true" ]]; then
-        # Safety check: live mode requires a successfully built modern command
-        if [[ "$use_modern_cli" != "true" || ${#CLAUDE_CMD_ARGS[@]} -eq 0 ]]; then
-            log_status "ERROR" "Live mode requires a built Claude command. Falling back to background mode."
-            LIVE_OUTPUT=false
-        fi
-    fi
-
-    if [[ "$LIVE_OUTPUT" == "true" ]]; then
-        log_status "INFO" "📺 Live output mode enabled - showing Claude Code streaming..."
-        echo -e "${PURPLE}━━━━━━━━━━━━━━━━ Claude Code Output ━━━━━━━━━━━━━━━━${NC}"
-
-        # Modify CLAUDE_CMD_ARGS: replace --output-format value with stream-json
-        # and add streaming-specific flags
-        local -a LIVE_CMD_ARGS=()
-        local skip_next=false
-        for arg in "${CLAUDE_CMD_ARGS[@]}"; do
-            if [[ "$skip_next" == "true" ]]; then
-                # Replace "json" with "stream-json" for output format
-                LIVE_CMD_ARGS+=("stream-json")
-                skip_next=false
-            elif [[ "$arg" == "--output-format" ]]; then
-                LIVE_CMD_ARGS+=("$arg")
-                skip_next=true
-            else
-                LIVE_CMD_ARGS+=("$arg")
-            fi
-        done
-
-        # Add streaming-specific flags (--verbose and --include-partial-messages)
-        # These are required for stream-json to work properly
-        LIVE_CMD_ARGS+=("--verbose" "--include-partial-messages")
-
-        # jq filter: show text + tool names + newlines for readability
-        local jq_filter='
-            if .type == "stream_event" then
-                if .event.type == "content_block_delta" and .event.delta.type == "text_delta" then
-                    .event.delta.text
-                elif .event.type == "content_block_start" and .event.content_block.type == "tool_use" then
-                    "\n\n⚡ [" + .event.content_block.name + "]\n"
-                elif .event.type == "content_block_stop" then
-                    "\n"
-                else
-                    empty
-                end
-            else
-                empty
-            end'
-
-        # Execute with streaming, preserving all flags from build_claude_command()
-        # Use stdbuf to disable buffering for real-time output
-        # Use portable_timeout for consistent timeout protection (Issue: missing timeout)
-        # Capture all pipeline exit codes for proper error handling
-        # stdin must be redirected from /dev/null because newer Claude CLI versions
-        # read from stdin even in -p (print) mode, causing the process to hang
-        set -o pipefail
-        portable_timeout ${timeout_seconds}s stdbuf -oL "${LIVE_CMD_ARGS[@]}" \
-            < /dev/null 2>&1 | stdbuf -oL tee "$output_file" | stdbuf -oL jq --unbuffered -j "$jq_filter" 2>/dev/null | tee "$LIVE_LOG_FILE"
-
-        # Capture exit codes from pipeline
-        local -a pipe_status=("${PIPESTATUS[@]}")
-        set +o pipefail
-
-        # Primary exit code is from Claude/timeout (first command in pipeline)
-        exit_code=${pipe_status[0]}
-
-        # Check for tee failures (second command) - could break logging/session
-        if [[ ${pipe_status[1]} -ne 0 ]]; then
-            log_status "WARN" "Failed to write stream output to log file (exit code ${pipe_status[1]})"
-        fi
-
-        # Check for jq failures (third command) - warn but don't fail
-        if [[ ${pipe_status[2]} -ne 0 ]]; then
-            log_status "WARN" "jq filter had issues parsing some stream events (exit code ${pipe_status[2]})"
-        fi
-
-        echo ""
-        echo -e "${PURPLE}━━━━━━━━━━━━━━━━ End of Output ━━━━━━━━━━━━━━━━━━━${NC}"
-
-        # Extract session ID from stream-json output for session continuity
-        # Stream-json format has session_id in the final "result" type message
-        # Keep full stream output in _stream.log, extract session data separately
-        if [[ "$CLAUDE_USE_CONTINUE" == "true" && -f "$output_file" ]]; then
-            # Preserve full stream output for analysis (don't overwrite output_file)
-            local stream_output_file="${output_file%.log}_stream.log"
-            cp "$output_file" "$stream_output_file"
-
-            # Extract the result message and convert to standard JSON format
-            # Use flexible regex to match various JSON formatting styles
-            # Matches: "type":"result", "type": "result", "type" : "result"
-            local result_line=$(grep -E '"type"[[:space:]]*:[[:space:]]*"result"' "$output_file" 2>/dev/null | tail -1)
-
-            if [[ -n "$result_line" ]]; then
-                # Validate that extracted line is valid JSON before using it
-                if echo "$result_line" | jq -e . >/dev/null 2>&1; then
-                    # Write validated result as the output_file for downstream processing
-                    # (save_claude_session and analyze_response expect JSON format)
-                    echo "$result_line" > "$output_file"
-                    log_status "INFO" "Extracted and validated session data from stream output"
-                else
-                    log_status "WARN" "Extracted result line is not valid JSON, keeping stream output"
-                    # Restore original stream output
-                    cp "$stream_output_file" "$output_file"
-                fi
-            else
-                log_status "WARN" "Could not find result message in stream output"
-                # Keep stream output as-is for debugging
-            fi
-        fi
-    else
-        # BACKGROUND MODE: Original behavior with progress monitoring
-        if [[ "$use_modern_cli" == "true" ]]; then
-            # Modern execution with command array (shell-injection safe)
-            # Execute array directly without bash -c to prevent shell metacharacter interpretation
-            # stdin must be redirected from /dev/null because newer Claude CLI versions
-            # read from stdin even in -p (print) mode, causing SIGTTIN suspension
-            # when the process is backgrounded
-            if portable_timeout ${timeout_seconds}s "${CLAUDE_CMD_ARGS[@]}" < /dev/null > "$output_file" 2>&1 &
-            then
-                :  # Continue to wait loop
-            else
-                log_status "ERROR" "❌ Failed to start Claude Code process (modern mode)"
-                # Fall back to legacy mode
-                log_status "INFO" "Falling back to legacy mode..."
-                use_modern_cli=false
-            fi
-        fi
-
-        # Fall back to legacy stdin piping if modern mode failed or not enabled
-        # Note: Legacy mode doesn't use --allowedTools, so tool permissions
-        # will be handled by Claude Code's default permission system
-        if [[ "$use_modern_cli" == "false" ]]; then
-            if portable_timeout ${timeout_seconds}s $CLAUDE_CODE_CMD < "$PROMPT_FILE" > "$output_file" 2>&1 &
-            then
-                :  # Continue to wait loop
-            else
-                log_status "ERROR" "❌ Failed to start Claude Code process"
-                return 1
-            fi
-        fi
-
-        # Get PID and monitor progress
-        local claude_pid=$!
-        local progress_counter=0
-
-        # Show progress while Claude Code is running
-        while kill -0 $claude_pid 2>/dev/null; do
-            progress_counter=$((progress_counter + 1))
-            case $((progress_counter % 4)) in
-                1) progress_indicator="⠋" ;;
-                2) progress_indicator="⠙" ;;
-                3) progress_indicator="⠹" ;;
-                0) progress_indicator="⠸" ;;
-            esac
-
-            # Get last line from output if available
-            local last_line=""
-            if [[ -f "$output_file" && -s "$output_file" ]]; then
-                last_line=$(tail -1 "$output_file" 2>/dev/null | head -c 80)
-                # Copy to live.log for tmux monitoring
-                cp "$output_file" "$LIVE_LOG_FILE" 2>/dev/null
-            fi
-
-            # Update progress file for monitor
-            cat > "$PROGRESS_FILE" << EOF
-{
-    "status": "executing",
-    "indicator": "$progress_indicator",
-    "elapsed_seconds": $((progress_counter * 10)),
-    "last_output": "$last_line",
-    "timestamp": "$(date '+%Y-%m-%d %H:%M:%S')"
-}
-EOF
-
-            # Only log if verbose mode is enabled
-            if [[ "$VERBOSE_PROGRESS" == "true" ]]; then
-                if [[ -n "$last_line" ]]; then
-                    log_status "INFO" "$progress_indicator Claude Code: $last_line... (${progress_counter}0s)"
-                else
-                    log_status "INFO" "$progress_indicator Claude Code working... (${progress_counter}0s elapsed)"
-                fi
-            fi
-
-            sleep 10
-        done
-
-        # Wait for the process to finish and get exit code
-        wait $claude_pid
-        exit_code=$?
-    fi
-
-    if [ $exit_code -eq 0 ]; then
-        # Only increment counter on successful execution
-        echo "$calls_made" > "$CALL_COUNT_FILE"
-
-        # Clear progress file
-        echo '{"status": "completed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
-
-        log_status "SUCCESS" "✅ Claude Code execution completed successfully"
-
-        # Save session ID from JSON output (Phase 1.1)
-        if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
-            save_claude_session "$output_file"
-        fi
-
-        # Analyze the response
-        log_status "INFO" "🔍 Analyzing Claude Code response..."
-        analyze_response "$output_file" "$loop_count"
-        local analysis_exit_code=$?
-
-        # Update exit signals based on analysis
-        update_exit_signals
-
-        # Log analysis summary
-        log_analysis_summary
-
-        # Get file change count for circuit breaker
-        # Fix #141: Detect both uncommitted changes AND committed changes
-        local files_changed=0
-        local loop_start_sha=""
-        local current_sha=""
-
-        if [[ -f "$RALPH_DIR/.loop_start_sha" ]]; then
-            loop_start_sha=$(cat "$RALPH_DIR/.loop_start_sha" 2>/dev/null || echo "")
-        fi
-
-        if command -v git &>/dev/null && git rev-parse --git-dir &>/dev/null 2>&1; then
-            current_sha=$(git rev-parse HEAD 2>/dev/null || echo "")
-
-            # Check if commits were made (HEAD changed)
-            if [[ -n "$loop_start_sha" && -n "$current_sha" && "$loop_start_sha" != "$current_sha" ]]; then
-                # Commits were made - count union of committed files AND working tree changes
-                # This catches cases where Claude commits some files but still has other modified files
-                files_changed=$(
-                    {
-                        git diff --name-only "$loop_start_sha" "$current_sha" 2>/dev/null
-                        git diff --name-only HEAD 2>/dev/null           # unstaged changes
-                        git diff --name-only --cached 2>/dev/null       # staged changes
-                    } | sort -u | wc -l
-                )
-                [[ "$VERBOSE_PROGRESS" == "true" ]] && log_status "DEBUG" "Detected $files_changed unique files changed (commits + working tree) since loop start"
-            else
-                # No commits - check for uncommitted changes (staged + unstaged)
-                files_changed=$(
-                    {
-                        git diff --name-only 2>/dev/null                # unstaged changes
-                        git diff --name-only --cached 2>/dev/null       # staged changes
-                    } | sort -u | wc -l
-                )
-            fi
-        fi
-
-        local has_errors="false"
-
-        # Two-stage error detection to avoid JSON field false positives
-        # Stage 1: Filter out JSON field patterns like "is_error": false
-        # Stage 2: Look for actual error messages in specific contexts
-        # Avoid type annotations like "error: Error" by requiring lowercase after ": error"
-        if grep -v '"[^"]*error[^"]*":' "$output_file" 2>/dev/null | \
-           grep -qE '(^Error:|^ERROR:|^error:|\]: error|Link: error|Error occurred|failed with error|[Ee]xception|Fatal|FATAL)'; then
-            has_errors="true"
-
-            # Debug logging: show what triggered error detection
-            if [[ "$VERBOSE_PROGRESS" == "true" ]]; then
-                log_status "DEBUG" "Error patterns found:"
-                grep -v '"[^"]*error[^"]*":' "$output_file" 2>/dev/null | \
-                    grep -nE '(^Error:|^ERROR:|^error:|\]: error|Link: error|Error occurred|failed with error|[Ee]xception|Fatal|FATAL)' | \
-                    head -3 | while IFS= read -r line; do
-                    log_status "DEBUG" "  $line"
-                done
-            fi
-
-            log_status "WARN" "Errors detected in output, check: $output_file"
-        fi
-        local output_length=$(wc -c < "$output_file" 2>/dev/null || echo 0)
-
-        # Record result in circuit breaker
-        record_loop_result "$loop_count" "$files_changed" "$has_errors" "$output_length"
-        local circuit_result=$?
-
-        if [[ $circuit_result -ne 0 ]]; then
-            log_status "WARN" "Circuit breaker opened - halting execution"
-            return 3  # Special code for circuit breaker trip
-        fi
-
-        return 0
-    else
-        # Clear progress file on failure
-        echo '{"status": "failed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
-
-        # Check if the failure is due to API 5-hour limit
-        if grep -qi "5.*hour.*limit\|limit.*reached.*try.*back\|usage.*limit.*reached" "$output_file"; then
-            log_status "ERROR" "🚫 Claude API 5-hour usage limit reached"
-            return 2  # Special return code for API limit
-        else
-            log_status "ERROR" "❌ Claude Code execution failed, check: $output_file"
-            return 1
-        fi
-    fi
-}
-
 # Cleanup function
-cleanup() {
-    log_status "INFO" "Ralph loop interrupted. Cleaning up..."
-    reset_session "manual_interrupt"
-    update_status "$loop_count" "$(cat "$CALL_COUNT_FILE" 2>/dev/null || echo "0")" "interrupted" "stopped"
-    exit 0
-}
-
-# Set up signal handlers
-trap cleanup SIGINT SIGTERM
-
-# Global variable for loop count (needed by cleanup function)
-loop_count=0
-
-# Main loop
 main() {
     # Load project-specific configuration from .ralphrc
     if load_ralphrc; then
@@ -1418,7 +534,11 @@ main() {
         fi
     fi
 
-    log_status "SUCCESS" "🚀 Ralph loop starting with Claude Code"
+    # Load AI provider
+    load_provider
+    provider_init
+
+    log_status "SUCCESS" "🚀 Ralph loop starting with AI provider: ${RALPH_PROVIDER:-claude}"
     log_status "INFO" "Max calls per hour: $MAX_CALLS_PER_HOUR"
     log_status "INFO" "Logs: $LOG_DIR/ | Docs: $DOCS_DIR/ | Status: $STATUS_FILE"
 
@@ -1549,8 +669,8 @@ main() {
         local calls_made=$(cat "$CALL_COUNT_FILE" 2>/dev/null || echo "0")
         update_status "$loop_count" "$calls_made" "executing" "running"
         
-        # Execute Claude Code
-        execute_claude_code "$loop_count"
+        # Execute AI provider
+        provider_execute "$loop_count" "$PROMPT_FILE" "$LIVE_OUTPUT"
         local exec_result=$?
         
         if [ $exec_result -eq 0 ]; then
@@ -1671,6 +791,9 @@ Examples:
 HELPEOF
 }
 
+# Load AI provider
+load_provider
+
 # Parse command line arguments
 while [[ $# -gt 0 ]]; do
     case $1 in
diff --git a/templates/system_prompts/generic_agent.md b/templates/system_prompts/generic_agent.md
new file mode 100644
index 00000000..41b7b45a
--- /dev/null
+++ b/templates/system_prompts/generic_agent.md
@@ -0,0 +1,63 @@
+# Ralph Agent Instructions
+
+You are an autonomous AI development agent called Ralph. Your goal is to complete the project requirements provided in the prompt.
+
+## Operational Protocol
+You operate in a loop. In each turn, you can either:
+1.  **Analyze** the codebase and plan your next steps.
+2.  **Execute Tools** to interact with the environment.
+3.  **Finalize** the task when all requirements are met.
+
+## Available Tools
+To use a tool, you MUST use the following XML format in your response. Do not use any other format for tool calls.
+
+### read_file
+Reads the content of a file.
+```xml
+<tool_call name="read_file">
+  <arg name="path">path/to/file</arg>
+</tool_call>
+```
+
+### write_file
+Creates or overwrites a file with new content.
+```xml
+<tool_call name="write_file">
+  <arg name="path">path/to/file</arg>
+  <arg name="content">
+  Your file content here...
+  </arg>
+</tool_call>
+```
+
+### run_command
+Executes a bash command.
+```xml
+<tool_call name="run_command">
+  <arg name="command">npm test</arg>
+</tool_call>
+```
+
+### list_files
+Lists files in a directory recursively.
+```xml
+<tool_call name="list_files">
+  <arg name="directory">.</arg>
+</tool_call>
+```
+
+## Response Format
+You can provide reasoning before or after tool calls.
+If you are finished with all tasks, include the following block at the end of your message:
+
+---RALPH_STATUS---
+STATUS: COMPLETE
+EXIT_SIGNAL: true
+------------------
+
+If you need more steps, use:
+
+---RALPH_STATUS---
+STATUS: WORKING
+EXIT_SIGNAL: false
+------------------
diff --git a/tests/unit/test_cli_modern.bats b/tests/unit/test_cli_modern.bats
index 28dbfbe5..e5417389 100644
--- a/tests/unit/test_cli_modern.bats
+++ b/tests/unit/test_cli_modern.bats
@@ -649,11 +649,11 @@ EOF
 # =============================================================================
 
 @test "modern CLI background execution redirects stdin from /dev/null" {
-    # Verify the implementation in ralph_loop.sh redirects stdin from /dev/null
+    # Verify the implementation in lib/providers/claude.sh redirects stdin from /dev/null
     # to prevent SIGTTIN suspension when claude is backgrounded.
     # Without this, newer Claude CLI versions hang indefinitely.
 
-    run grep 'portable_timeout.*CLAUDE_CMD_ARGS.*< /dev/null.*&' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep 'portable_timeout.*CLAUDE_CMD_ARGS.*< /dev/null.*&' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     assert_success
     [[ "$output" == *'< /dev/null'* ]]
@@ -662,10 +662,8 @@ EOF
 @test "live mode execution redirects stdin from /dev/null" {
     # Verify the live (streaming) mode also redirects stdin from /dev/null.
     # This path is used by ralph --monitor (which adds --live).
-    # The live mode splits across two lines (line continuation with \),
-    # so we check the continuation line that has < /dev/null.
 
-    local script="${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    local script="${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # The live mode has LIVE_CMD_ARGS on one line and < /dev/null on the next
     run grep '< /dev/null 2>&1 |' "$script"
@@ -681,7 +679,7 @@ EOF
     # We check that no portable_timeout line invoking claude lacks a stdin redirect
     # (either on the same line or a continuation line).
 
-    local script="${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    local script="${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # All 3 portable_timeout lines that invoke claude should have < somewhere nearby
     # Modern background: has < /dev/null on same line
@@ -700,7 +698,7 @@ EOF
 @test "modern CLI background execution has comment explaining stdin redirect" {
     # Verify the fix is documented with context about why /dev/null is needed
 
-    run grep -c 'stdin must be redirected' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -c 'stdin must be redirected' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     assert_success
     # Should appear in both background and live mode sections
@@ -785,9 +783,9 @@ EOF
     [[ "$cmd_string" == *"-p"* ]]
 }
 
-@test "live mode overrides text to json format in ralph_loop.sh" {
-    # Verify ralph_loop.sh contains the live mode format override logic
-    run grep -A3 'LIVE_OUTPUT.*true.*CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+@test "live mode overrides text to json format in lib/providers/claude.sh" {
+    # Verify lib/providers/claude.sh contains the live mode format override logic
+    run grep -A3 'LIVE_OUTPUT.*true.*CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should find the override block
     [[ "$output" == *"CLAUDE_OUTPUT_FORMAT"* ]]
@@ -797,32 +795,24 @@ EOF
 @test "live mode format override preserves json format unchanged" {
     # The override should only trigger when format is "text", not "json"
     # Verify the condition checks for text specifically
-    run grep 'CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep 'CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should check specifically for "text" (not a blanket override)
-    [[ "$output" == *'"text"'* ]]
+    [[ "$output" == *'text'* ]]
 }
 
 @test "safety check prevents live mode with empty CLAUDE_CMD_ARGS" {
-    # Verify ralph_loop.sh has the safety check for empty CLAUDE_CMD_ARGS
-    # The check also verifies use_modern_cli is true (not just non-empty array)
-    run grep -A3 'use_modern_cli.*CLAUDE_CMD_ARGS.*-eq 0' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    # Verify lib/providers/claude.sh has the safety check for empty CLAUDE_CMD_ARGS
+    run grep -A3 'use_modern_cli.*CLAUDE_CMD_ARGS.*-eq 0' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should find safety check that falls back to background mode
     [[ "$output" == *"LIVE_OUTPUT"* ]] || [[ "$output" == *"background"* ]]
 }
 
-@test "build_claude_command is called regardless of output format in ralph_loop.sh" {
+@test "build_claude_command is called regardless of output format in lib/providers/claude.sh" {
     # Verify that build_claude_command is NOT gated behind JSON-only check
-    # The old pattern was: if [[ "$CLAUDE_OUTPUT_FORMAT" == "json" ]]; then build_claude_command...
-    # The new pattern should call build_claude_command unconditionally
+    local script="${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
-    # Check that build_claude_command call is NOT inside a JSON-only conditional
-    # Look for the actual call site (not the function definition or comments)
-    local script="${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
-
-    # The old pattern: "json" check immediately followed by build_claude_command
-    # should no longer exist as a gate
     run bash -c "sed -n '/# Build the Claude CLI command/,/# Execute Claude Code/p' '$script' | grep -c 'CLAUDE_OUTPUT_FORMAT.*json.*build_claude_command'"
 
     # Should find 0 matches (the gate has been removed)
diff --git a/tests/unit/test_providers.bats b/tests/unit/test_providers.bats
new file mode 100644
index 00000000..097f98e2
--- /dev/null
+++ b/tests/unit/test_providers.bats
@@ -0,0 +1,69 @@
+#!/usr/bin/env bats
+
+load "../helpers/test_helper"
+
+setup() {
+    export RALPH_DIR=".ralph_test"
+    mkdir -p "$RALPH_DIR/logs"
+    mkdir -p "$RALPH_DIR/specs"
+    
+    # Mock log_status
+    log_status() {
+        echo "[$1] $2"
+    }
+    export -f log_status
+}
+
+teardown() {
+    rm -rf "$RALPH_DIR"
+}
+
+@test "load_provider loads claude by default" {
+    export RALPH_HOME="$BATS_TEST_DIRNAME/../.."
+    source "$BATS_TEST_DIRNAME/../../lib/providers/base.sh"
+    
+    run load_provider
+    assert_success
+    [[ "$output" == *"[INFO] Loaded AI provider: claude"* ]]
+}
+
+@test "load_provider loads gemini when specified" {
+    export RALPH_PROVIDER="gemini"
+    export RALPH_HOME="$BATS_TEST_DIRNAME/../.."
+    source "$BATS_TEST_DIRNAME/../../lib/providers/base.sh"
+    
+    run load_provider
+    assert_success
+    [[ "$output" == *"[INFO] Loaded AI provider: gemini"* ]]
+}
+
+@test "load_provider loads copilot when specified" {
+    export RALPH_PROVIDER="copilot"
+    export RALPH_HOME="$BATS_TEST_DIRNAME/../.."
+    source "$BATS_TEST_DIRNAME/../../lib/providers/base.sh"
+    
+    run load_provider
+    assert_success
+    [[ "$output" == *"[INFO] Loaded AI provider: copilot"* ]]
+}
+
+@test "claude provider implements required functions" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/claude.sh"
+    declare -F provider_init
+    declare -F provider_execute
+    declare -F validate_allowed_tools
+}
+
+@test "gemini provider implements required functions" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/gemini.sh"
+    declare -F provider_init
+    declare -F provider_execute
+    declare -F validate_allowed_tools
+}
+
+@test "copilot provider implements required functions" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/copilot.sh"
+    declare -F provider_init
+    declare -F provider_execute
+    declare -F validate_allowed_tools
+}
\ No newline at end of file
diff --git a/tests/unit/test_session_continuity.bats b/tests/unit/test_session_continuity.bats
index 6236ff89..970c8e43 100644
--- a/tests/unit/test_session_continuity.bats
+++ b/tests/unit/test_session_continuity.bats
@@ -76,7 +76,7 @@ teardown() {
 
 function_exists_in_ralph() {
     local func_name=$1
-    grep -qE "^${func_name}\s*\(\)|^function\s+${func_name}" "${BATS_TEST_DIRNAME}/../../ralph_loop.sh" 2>/dev/null
+    grep -qE "^${func_name}\s*\(\)|^function\s+${func_name}" "${BATS_TEST_DIRNAME}/../../lib/session_manager.sh" 2>/dev/null
 }
 
 # =============================================================================

From b37b518310e075606c29f18ab907903d78b89e5d Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 18:56:41 +0100
Subject: [PATCH 02/13] fix: sanitize RALPH_PROVIDER to prevent path traversal

---
 lib/providers/base.sh          | 10 +++++++++-
 tests/unit/test_providers.bats | 20 ++++++++++++++++++++
 2 files changed, 29 insertions(+), 1 deletion(-)

diff --git a/lib/providers/base.sh b/lib/providers/base.sh
index f2feef03..57ca82e0 100644
--- a/lib/providers/base.sh
+++ b/lib/providers/base.sh
@@ -3,7 +3,15 @@
 
 # Load the configured provider
 load_provider() {
-    local provider_name="${RALPH_PROVIDER:-claude}"
+    local raw_provider="${RALPH_PROVIDER:-claude}"
+
+    # Sanitize and validate provider name to prevent path traversal
+    if [[ ! "$raw_provider" =~ ^[a-zA-Z0-9_-]+$ ]]; then
+        log_status "ERROR" "Invalid AI provider name: $raw_provider (only alphanumeric, underscores, and hyphens allowed)"
+        exit 1
+    fi
+
+    local provider_name="$raw_provider"
     local provider_script="$RALPH_HOME/lib/providers/${provider_name}.sh"
     
     # Fallback to local path if RALPH_HOME not set or script not found
diff --git a/tests/unit/test_providers.bats b/tests/unit/test_providers.bats
index 097f98e2..fa501cea 100644
--- a/tests/unit/test_providers.bats
+++ b/tests/unit/test_providers.bats
@@ -66,4 +66,24 @@ teardown() {
     declare -F provider_init
     declare -F provider_execute
     declare -F validate_allowed_tools
+}
+
+@test "load_provider rejects invalid provider names (path traversal)" {
+    export RALPH_PROVIDER="../../etc/passwd"
+    export RALPH_HOME="$BATS_TEST_DIRNAME/../.."
+    source "$BATS_TEST_DIRNAME/../../lib/providers/base.sh"
+    
+    run load_provider
+    assert_failure
+    [[ "$output" == *"[ERROR] Invalid AI provider name"* ]]
+}
+
+@test "load_provider rejects provider names with special characters" {
+    export RALPH_PROVIDER="my;provider"
+    export RALPH_HOME="$BATS_TEST_DIRNAME/../.."
+    source "$BATS_TEST_DIRNAME/../../lib/providers/base.sh"
+    
+    run load_provider
+    assert_failure
+    [[ "$output" == *"[ERROR] Invalid AI provider name"* ]]
 }
\ No newline at end of file

From 698e5e2ff9b7b37eefa02693bdefa2c9531de2a8 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 18:57:20 +0100
Subject: [PATCH 03/13] fix: restrict allowed tools to specific patterns in
 Claude provider

---
 lib/providers/claude.sh        |  3 ++-
 tests/unit/test_providers.bats | 26 ++++++++++++++++++++++++++
 2 files changed, 28 insertions(+), 1 deletion(-)

diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
index 499485a5..6313f2de 100644
--- a/lib/providers/claude.sh
+++ b/lib/providers/claude.sh
@@ -61,7 +61,8 @@ validate_allowed_tools() {
         [[ -z "$tool" ]] && continue
         local valid=false
         for pattern in "${VALID_TOOL_PATTERNS[@]}"; do
-            if [[ "$tool" == "$pattern" || "$tool" =~ ^Bash\(.+\)$ ]]; then
+            # Use glob-style matching for tool against the pattern
+            if [[ "$tool" == $pattern ]]; then
                 valid=true
                 break
             fi
diff --git a/tests/unit/test_providers.bats b/tests/unit/test_providers.bats
index fa501cea..3b934152 100644
--- a/tests/unit/test_providers.bats
+++ b/tests/unit/test_providers.bats
@@ -68,6 +68,32 @@ teardown() {
     declare -F validate_allowed_tools
 }
 
+@test "validate_allowed_tools matches exact patterns" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/claude.sh"
+    run validate_allowed_tools "Write,Read,Edit"
+    assert_success
+}
+
+@test "validate_allowed_tools matches wildcard patterns" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/claude.sh"
+    run validate_allowed_tools "Bash(git log),Bash(npm install)"
+    assert_success
+}
+
+@test "validate_allowed_tools rejects unauthorized Bash tools" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/claude.sh"
+    run validate_allowed_tools "Bash(rm -rf /)"
+    assert_failure
+    [[ "$output" == *"Error: Invalid tool: 'Bash(rm -rf /)'"* ]]
+}
+
+@test "validate_allowed_tools rejects unknown tools" {
+    source "$BATS_TEST_DIRNAME/../../lib/providers/claude.sh"
+    run validate_allowed_tools "EvilTool"
+    assert_failure
+    [[ "$output" == *"Error: Invalid tool: 'EvilTool'"* ]]
+}
+
 @test "load_provider rejects invalid provider names (path traversal)" {
     export RALPH_PROVIDER="../../etc/passwd"
     export RALPH_HOME="$BATS_TEST_DIRNAME/../.."

From 6d66c374a0be7faf671d85a5610d4b482f33ea37 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 18:57:52 +0100
Subject: [PATCH 04/13] fix: prevent global mutation of CLAUDE_OUTPUT_FORMAT in
 live mode

---
 lib/providers/claude.sh | 16 +++++++++-------
 1 file changed, 9 insertions(+), 7 deletions(-)

diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
index 6313f2de..4d0242bc 100644
--- a/lib/providers/claude.sh
+++ b/lib/providers/claude.sh
@@ -158,17 +158,18 @@ execute_claude_code() {
         session_id=$(init_claude_session)
     fi
 
-    # Live mode requires JSON output (stream-json) — override text format
-    if [[ "$LIVE_OUTPUT" == "true" && "$CLAUDE_OUTPUT_FORMAT" == "text" ]]; then
-        log_status "WARN" "Live mode requires JSON output format. Overriding text → json for this session."
-        CLAUDE_OUTPUT_FORMAT="json"
+    # Live mode requires JSON output (stream-json) — use local override instead of global mutation
+    local output_format="$CLAUDE_OUTPUT_FORMAT"
+    if [[ "$LIVE_OUTPUT" == "true" && "$output_format" == "text" ]]; then
+        log_status "WARN" "Live mode requires JSON output format. Using json override for this session."
+        output_format="json"
     fi
 
     # Build the Claude CLI command with modern flags
     local use_modern_cli=false
-    if build_claude_command "$PROMPT_FILE" "$loop_context" "$session_id"; then
+    if build_claude_command "$PROMPT_FILE" "$loop_context" "$session_id" "$output_format"; then
         use_modern_cli=true
-        log_status "INFO" "Using modern CLI mode (${CLAUDE_OUTPUT_FORMAT} output)"
+        log_status "INFO" "Using modern CLI mode (${output_format} output)"
     else
         log_status "WARN" "Failed to build modern CLI command, falling back to legacy mode"
         if [[ "$LIVE_OUTPUT" == "true" ]]; then
@@ -296,9 +297,10 @@ build_claude_command() {
     local prompt_file=$1
     local loop_context=$2
     local session_id=$3
+    local output_format="${4:-$CLAUDE_OUTPUT_FORMAT}"
     CLAUDE_CMD_ARGS=("$CLAUDE_CODE_CMD")
     [[ ! -f "$prompt_file" ]] && return 1
-    [[ "$CLAUDE_OUTPUT_FORMAT" == "json" ]] && CLAUDE_CMD_ARGS+=("--output-format" "json")
+    [[ "$output_format" == "json" ]] && CLAUDE_CMD_ARGS+=("--output-format" "json")
     if [[ -n "$CLAUDE_ALLOWED_TOOLS" ]]; then
         CLAUDE_CMD_ARGS+=("--allowedTools")
         local IFS=','

From 84dbbfea194a732f28bc24cfefe16bd9e8e5a5b8 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 18:59:05 +0100
Subject: [PATCH 05/13] fix: use jq for robust JSON construction in
 PROGRESS_FILE

---
 lib/providers/claude.sh | 19 ++++++++++++++-----
 1 file changed, 14 insertions(+), 5 deletions(-)

diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
index 4d0242bc..97cf78e5 100644
--- a/lib/providers/claude.sh
+++ b/lib/providers/claude.sh
@@ -241,9 +241,12 @@ execute_claude_code() {
                 last_line=$(tail -1 "$output_file" 2>/dev/null | head -c 80)
                 cp "$output_file" "$LIVE_LOG_FILE" 2>/dev/null
             fi
-            cat > "$PROGRESS_FILE" << EOF
-{ "status": "executing", "elapsed_seconds": $((progress_counter * 10)), "last_output": "$last_line", "timestamp": "$(date '+%Y-%m-%d %H:%M:%S')" }
-EOF
+            jq -n \
+                --arg status "executing" \
+                --argjson elapsed_seconds "$((progress_counter * 10))" \
+                --arg last_output "$last_line" \
+                --arg timestamp "$(date '+%Y-%m-%d %H:%M:%S')" \
+                '{status: $status, elapsed_seconds: $elapsed_seconds, last_output: $last_output, timestamp: $timestamp}' > "$PROGRESS_FILE"
             sleep 10
         done
         wait $claude_pid
@@ -252,7 +255,10 @@ EOF
 
     if [ $exit_code -eq 0 ]; then
         echo "$calls_made" > "$CALL_COUNT_FILE"
-        echo '{"status": "completed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
+        jq -n \
+            --arg status "completed" \
+            --arg timestamp "$(date '+%Y-%m-%d %H:%M:%S')" \
+            '{status: $status, timestamp: $timestamp}' > "$PROGRESS_FILE"
         log_status "SUCCESS" "✅ Claude Code execution completed successfully"
         [[ "$CLAUDE_USE_CONTINUE" == "true" ]] && save_claude_session "$output_file"
         log_status "INFO" "🔍 Analyzing Claude Code response..."
@@ -281,7 +287,10 @@ EOF
         [[ $? -ne 0 ]] && return 3
         return 0
     else
-        echo '{"status": "failed", "timestamp": "'$(date '+%Y-%m-%d %H:%M:%S')'"}' > "$PROGRESS_FILE"
+        jq -n \
+            --arg status "failed" \
+            --arg timestamp "$(date '+%Y-%m-%d %H:%M:%S')" \
+            '{status: $status, timestamp: $timestamp}' > "$PROGRESS_FILE"
         if grep -qi "5.*hour.*limit\|limit.*reached.*try.*back\|usage.*limit.*reached" "$output_file"; then
             log_status "ERROR" "🚫 Claude API 5-hour usage limit reached"
             return 2

From 7149c0ed22c7f65d099eda10cf88803d2af750da Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:04:19 +0100
Subject: [PATCH 06/13] fix: improve session age handling and test suite
 compatibility

- Update get_session_file_age_hours to return -1 for missing files
- Refactor should_resume_session to use parse_iso_to_epoch
- Add logging to init_claude_session
- Update session continuity tests for provider-based architecture
---
 lib/providers/claude.sh                 | 13 ++++++---
 lib/response_analyzer.sh                | 35 ++++--------------------
 tests/unit/test_session_continuity.bats | 36 ++++++++++++-------------
 3 files changed, 33 insertions(+), 51 deletions(-)

diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
index 97cf78e5..b418f2f1 100644
--- a/lib/providers/claude.sh
+++ b/lib/providers/claude.sh
@@ -103,11 +103,18 @@ init_claude_session() {
     local session_file="$RALPH_DIR/.claude_session_id"
     if [[ -f "$session_file" ]]; then
         local age_hours=$(get_session_file_age_hours "$session_file")
-        if [[ $age_hours -eq -1 ]] || [[ $age_hours -ge $CLAUDE_SESSION_EXPIRY_HOURS ]]; then
+        if [[ $age_hours -eq -1 ]]; then
+            log_status "WARN" "Failed to determine session age, starting fresh"
+            rm -f "$session_file"
+            echo ""
+        elif [[ $age_hours -ge ${CLAUDE_SESSION_EXPIRY_HOURS:-24} ]]; then
+            log_status "INFO" "Session expired (age: $age_hours hours), starting fresh"
             rm -f "$session_file"
             echo ""
         else
-            cat "$session_file" 2>/dev/null
+            local session_id=$(cat "$session_file" 2>/dev/null)
+            log_status "INFO" "Resuming Claude session: $session_id ($age_hours hours old)"
+            echo "$session_id"
         fi
     else
         echo ""
@@ -335,7 +342,7 @@ save_claude_session() {
 # Helper for session age
 get_session_file_age_hours() {
     local file=$1
-    [[ ! -f "$file" ]] && echo "0" && return
+    [[ ! -f "$file" ]] && echo "-1" && return
     local file_mtime
     if file_mtime=$(stat -c %Y "$file" 2>/dev/null); then :
     elif file_mtime=$(stat -f %m "$file" 2>/dev/null); then :
diff --git a/lib/response_analyzer.sh b/lib/response_analyzer.sh
index 886f7b10..7a249275 100644
--- a/lib/response_analyzer.sh
+++ b/lib/response_analyzer.sh
@@ -823,47 +823,22 @@ should_resume_session() {
     # Get session timestamp
     local timestamp=$(jq -r '.timestamp // ""' "$SESSION_FILE" 2>/dev/null)
 
-    if [[ -z "$timestamp" ]]; then
+    if [[ -z "$timestamp" || "$timestamp" == "null" ]]; then
         echo "false"
         return 1
     fi
 
     # Calculate session age using date utilities
     local now=$(get_epoch_seconds)
-    local session_time
-
-    # Parse ISO timestamp to epoch - try multiple formats for cross-platform compatibility
-    # Strip milliseconds if present (e.g., 2026-01-09T10:30:00.123+00:00 → 2026-01-09T10:30:00+00:00)
-    local clean_timestamp="${timestamp}"
-    if [[ "$timestamp" =~ \.[0-9]+[+-Z] ]]; then
-        clean_timestamp=$(echo "$timestamp" | sed 's/\.[0-9]*\([+-Z]\)/\1/')
-    fi
-
-    if command -v gdate &>/dev/null; then
-        # macOS with coreutils
-        session_time=$(gdate -d "$clean_timestamp" +%s 2>/dev/null)
-    elif date --version 2>&1 | grep -q GNU; then
-        # GNU date (Linux)
-        session_time=$(date -d "$clean_timestamp" +%s 2>/dev/null)
-    else
-        # BSD date (macOS without coreutils) - try parsing ISO format
-        # Format: 2026-01-09T10:30:00+00:00 or 2026-01-09T10:30:00Z
-        # Strip timezone suffix for BSD date parsing
-        local date_only="${clean_timestamp%[+-Z]*}"
-        session_time=$(date -j -f "%Y-%m-%dT%H:%M:%S" "$date_only" +%s 2>/dev/null)
-    fi
-
-    # If we couldn't parse the timestamp, consider session expired
-    if [[ -z "$session_time" || ! "$session_time" =~ ^[0-9]+$ ]]; then
-        echo "false"
-        return 1
-    fi
+    local session_time=$(parse_iso_to_epoch "$timestamp")
 
+    # If parse_iso_to_epoch failed (returned current time), it's risky but should work for "recent"
     # Calculate age in seconds
     local age=$((now - session_time))
 
     # Check if session is still valid (less than expiration time)
-    if [[ $age -lt $SESSION_EXPIRATION_SECONDS ]]; then
+    # Also handle negative age (time drift) by taking absolute value or just checking range
+    if [[ $age -lt $SESSION_EXPIRATION_SECONDS ]] && [[ $age -gt -300 ]]; then
         echo "true"
         return 0
     else
diff --git a/tests/unit/test_session_continuity.bats b/tests/unit/test_session_continuity.bats
index 970c8e43..00ac1add 100644
--- a/tests/unit/test_session_continuity.bats
+++ b/tests/unit/test_session_continuity.bats
@@ -271,12 +271,12 @@ EOF
 # SESSION CONTINUITY IN CLAUDE CLI COMMAND
 # =============================================================================
 
-@test "--continue flag is added to Claude CLI command" {
-    # Check that --continue is used in build_claude_command
-    run grep -E '\-\-continue' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+@test "--resume flag is added to Claude CLI command" {
+    # Check that --resume is used in build_claude_command in the provider script
+    run grep -E '\-\-resume' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     [[ $status -eq 0 ]]
-    [[ "$output" == *"--continue"* ]]
+    [[ "$output" == *"--resume"* ]]
 }
 
 @test "CLAUDE_USE_CONTINUE configuration controls session continuity" {
@@ -372,7 +372,7 @@ EOF
 
 @test "init_claude_session checks session expiration" {
     # Check that init_claude_session includes expiration logic
-    run grep -A30 'init_claude_session' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A30 'init_claude_session' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should reference expiration or age checking
     [[ "$output" == *"expir"* ]] || [[ "$output" == *"age"* ]] || [[ "$output" == *"stat"* ]] || skip "Session expiration not yet implemented in init_claude_session"
@@ -380,7 +380,7 @@ EOF
 
 @test "init_claude_session uses cross-platform stat command" {
     # Check for uname or Darwin/Linux detection in get_session_file_age_hours
-    run grep -A30 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A30 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should have cross-platform handling
     [[ "$output" == *"Darwin"* ]] || [[ "$output" == *"uname"* ]] || skip "Cross-platform stat not yet implemented"
@@ -388,31 +388,31 @@ EOF
 
 @test "get_session_file_age_hours returns correct age" {
     # Check if helper function exists
-    run grep 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     [[ $status -eq 0 ]] || skip "get_session_file_age_hours function not yet implemented"
 }
 
-@test "get_session_file_age_hours returns 0 for missing file" {
+@test "get_session_file_age_hours returns -1 for missing file" {
     # Source the script to get the function
-    source "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    source "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Test with non-existent file
     run get_session_file_age_hours "/nonexistent/path/file"
 
-    [[ "$output" == "0" ]]
+    [[ "$output" == "-1" ]]
 }
 
 @test "get_session_file_age_hours returns -1 for stat failure" {
     # Source the script to get the function
-    source "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    source "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Create a file then make it inaccessible (simulate stat failure via directory permissions)
     local test_file="$TEST_DIR/unreadable_file"
     echo "test" > "$test_file"
 
     # Verify the function code handles stat failure by checking the implementation
-    run grep -A35 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A35 'get_session_file_age_hours' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
     [[ "$output" == *'echo "-1"'* ]]
 }
 
@@ -435,28 +435,28 @@ EOF
 
 @test "init_claude_session logs expiration with age info" {
     # Source the script to get the function
-    source "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    source "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Verify code structure includes age logging
-    run grep -A40 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A40 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
     [[ "$output" == *'age_hours'* ]] && [[ "$output" == *'expired'* ]]
 }
 
 @test "init_claude_session logs session age when resuming" {
     # Source the script to get the function
-    source "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    source "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Verify code structure includes resume logging
-    run grep -A50 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A50 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
     [[ "$output" == *'Resuming'* ]] && [[ "$output" == *'old'* ]]
 }
 
 @test "init_claude_session handles stat failure gracefully" {
     # Source the script to get the function
-    source "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    source "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Verify code structure handles -1 return
-    run grep -A40 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../ralph_loop.sh"
+    run grep -A40 'init_claude_session()' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
     [[ "$output" == *"-1"* ]] && [[ "$output" == *"WARN"* ]]
 }
 

From de21ae57c38f3fcf70a2937ad526c9f6c339d8b8 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:05:05 +0100
Subject: [PATCH 07/13] fix: correctly join multi-line Copilot command
 invocation

---
 lib/providers/copilot.sh | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/lib/providers/copilot.sh b/lib/providers/copilot.sh
index 23b53b22..0ffe7422 100644
--- a/lib/providers/copilot.sh
+++ b/lib/providers/copilot.sh
@@ -49,10 +49,10 @@ $prompt_content"
     # but since this is a bash script, we can use the same trick as in ralph_loop.sh if needed.
     # For now, simplistic execution.
     
-    $COPILOT_CMD -p "$full_prompt" 
-        $session_arg 
-        --allow-all-tools 
-        --no-ask-user 
+    $COPILOT_CMD -p "$full_prompt" \
+        $session_arg \
+        --allow-all-tools \
+        --no-ask-user \
         > "$output_file" 2>&1
     
     local exit_code=$?

From b27cd2e4a23cd527958d737258c695e0753d204b Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:05:54 +0100
Subject: [PATCH 08/13] fix: log warning for unsupported live mode in Gemini
 provider

---
 lib/providers/gemini.sh | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
index e919b379..758e4c3b 100644
--- a/lib/providers/gemini.sh
+++ b/lib/providers/gemini.sh
@@ -17,8 +17,10 @@ provider_execute() {
     local loop_count=$1
     local prompt_file=$2
     local live_mode=$3
-    
-    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
+
+    if [[ "$live_mode" == "true" ]]; then
+        log_status "WARN" "Live mode is not yet supported for Gemini provider. Falling back to background mode."
+    fi
     local output_file="$LOG_DIR/gemini_output_${timestamp}.log"
     
     local session_arg=""

From 1a54b9a446dd0539c5f9bbc52a5e6d3ead94a2e8 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:06:26 +0100
Subject: [PATCH 09/13] fix: use array for Gemini session arguments to improve
 robustness

---
 lib/providers/gemini.sh | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
index 758e4c3b..09c3ac24 100644
--- a/lib/providers/gemini.sh
+++ b/lib/providers/gemini.sh
@@ -21,12 +21,13 @@ provider_execute() {
     if [[ "$live_mode" == "true" ]]; then
         log_status "WARN" "Live mode is not yet supported for Gemini provider. Falling back to background mode."
     fi
+    local timestamp=$(date '+%Y-%m-%d_%H-%M-%S')
     local output_file="$LOG_DIR/gemini_output_${timestamp}.log"
     
-    local session_arg=""
+    local session_arg=()
     if [[ "$CLAUDE_USE_CONTINUE" == "true" ]]; then
         # Gemini uses --resume latest or session ID
-        session_arg="--resume latest" 
+        session_arg=(--resume latest) 
     fi
     
     # Build loop context
@@ -41,7 +42,7 @@ provider_execute() {
     # We use -p for non-interactive prompt
     
     $GEMINI_CMD -p "$full_prompt" \
-        $session_arg \
+        "${session_arg[@]}" \
         --yolo \
         --output-format text \
         > "$output_file" 2>&1

From 76f86d835ea1555d386ad021e6e9085d4267707c Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:06:58 +0100
Subject: [PATCH 10/13] fix: use real newlines in Gemini prompt construction

---
 lib/providers/gemini.sh | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
index 09c3ac24..1afccc2e 100644
--- a/lib/providers/gemini.sh
+++ b/lib/providers/gemini.sh
@@ -33,7 +33,8 @@ provider_execute() {
     # Build loop context
     local loop_context=$(build_loop_context "$loop_count")
     local prompt_content=$(cat "$prompt_file")
-    local full_prompt="$loop_context\n\n$prompt_content"
+    local full_prompt
+    full_prompt=$(printf "%s\n\n%s" "$loop_context" "$prompt_content")
     
     log_status "INFO" "Executing Gemini CLI (Agent Mode)..."
     

From c31608ebfc02e0ac10ddc04c3a2d25e43bea188e Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:12:12 +0100
Subject: [PATCH 11/13] refactor: extract build_loop_context to shared base
 provider

- Move build_loop_context() to lib/providers/base.sh
- Remove duplicates from claude.sh, gemini.sh, and copilot.sh
- Source base.sh in provider scripts
- Restore missing stdin redirect comments in claude.sh
- Update modern CLI tests to match new implementation
---
 lib/providers/base.sh           | 23 +++++++++++++++++++++++
 lib/providers/claude.sh         | 28 +++++++---------------------
 lib/providers/copilot.sh        | 25 ++++---------------------
 lib/providers/gemini.sh         | 25 ++++---------------------
 tests/unit/test_cli_modern.bats | 14 +++++++-------
 5 files changed, 45 insertions(+), 70 deletions(-)

diff --git a/lib/providers/base.sh b/lib/providers/base.sh
index 57ca82e0..c933f514 100644
--- a/lib/providers/base.sh
+++ b/lib/providers/base.sh
@@ -27,3 +27,26 @@ load_provider() {
         exit 1
     fi
 }
+
+# Helper to build loop context shared by all providers
+build_loop_context() {
+    local loop_count=$1
+    local context="Loop #$loop_count. "
+
+    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
+        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
+        context+="Remaining tasks: ${incomplete_tasks:-0}. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
+        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
+        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
+    fi
+
+    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
+        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
+        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
+    fi
+
+    echo "${context:0:500}"
+}
diff --git a/lib/providers/claude.sh b/lib/providers/claude.sh
index b418f2f1..ab562537 100644
--- a/lib/providers/claude.sh
+++ b/lib/providers/claude.sh
@@ -2,6 +2,9 @@
 # Claude Provider for Ralph
 # Implements the Claude Code CLI integration
 
+# Source base provider for shared utilities
+source "$(dirname "${BASH_SOURCE[0]}")/base.sh"
+
 # Provider-specific configuration
 CLAUDE_CODE_CMD="claude"
 CLAUDE_MIN_VERSION="2.0.76"
@@ -76,27 +79,7 @@ validate_allowed_tools() {
 }
 
 # Build loop context for Claude Code session
-build_loop_context() {
-    local loop_count=$1
-    local context="Loop #$loop_count. "
-
-    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
-        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
-        context+="Remaining tasks: ${incomplete_tasks:-0}. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
-        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
-        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
-        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
-        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
-    fi
-
-    echo "${context:0:500}"
-}
+# (Now provided by lib/providers/base.sh)
 
 # Initialize or resume Claude session
 init_claude_session() {
@@ -217,6 +200,7 @@ execute_claude_code() {
         local jq_filter='if .type == "stream_event" then if .event.type == "content_block_delta" and .event.delta.type == "text_delta" then .event.delta.text elif .event.type == "content_block_start" and .event.content_block.type == "tool_use" then "\n\n⚡ [" + .event.content_block.name + "]\n" elif .event.type == "content_block_stop" then "\n" else empty end else empty end'
 
         set -o pipefail
+        # Fix: stdin must be redirected from /dev/null to prevent hangs in live mode
         portable_timeout ${timeout_seconds}s stdbuf -oL "${LIVE_CMD_ARGS[@]}" < /dev/null 2>&1 | stdbuf -oL tee "$output_file" | stdbuf -oL jq --unbuffered -j "$jq_filter" 2>/dev/null | tee "$LIVE_LOG_FILE"
         local -a pipe_status=("${PIPESTATUS[@]}")
         set +o pipefail
@@ -235,8 +219,10 @@ execute_claude_code() {
     else
         # BACKGROUND MODE
         if [[ "$use_modern_cli" == "true" ]]; then
+            # Fix: stdin must be redirected from /dev/null to prevent hangs in background mode
             portable_timeout ${timeout_seconds}s "${CLAUDE_CMD_ARGS[@]}" < /dev/null > "$output_file" 2>&1 &
         else
+            # Fix: stdin must be redirected from /dev/null to prevent hangs in background mode
             portable_timeout ${timeout_seconds}s $CLAUDE_CODE_CMD < "$PROMPT_FILE" > "$output_file" 2>&1 &
         fi
         local claude_pid=$!
diff --git a/lib/providers/copilot.sh b/lib/providers/copilot.sh
index 0ffe7422..5663b64e 100644
--- a/lib/providers/copilot.sh
+++ b/lib/providers/copilot.sh
@@ -2,6 +2,9 @@
 # GitHub Copilot Provider for Ralph
 # Implements the GitHub Copilot CLI integration
 
+# Source base provider for shared utilities
+source "$(dirname "${BASH_SOURCE[0]}")/base.sh"
+
 # Provider-specific configuration
 COPILOT_CMD="copilot"
 
@@ -78,24 +81,4 @@ validate_allowed_tools() {
 }
 
 # Helper to build loop context
-build_loop_context() {
-    local loop_count=$1
-    local context="Loop #$loop_count. "
-
-    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
-        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
-        context+="Remaining tasks: ${incomplete_tasks:-0}. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
-        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
-        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
-        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
-        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
-    fi
-
-    echo "${context:0:500}"
-}
+# (Now provided by lib/providers/base.sh)
diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
index 1afccc2e..581dfa7a 100644
--- a/lib/providers/gemini.sh
+++ b/lib/providers/gemini.sh
@@ -2,6 +2,9 @@
 # Gemini Provider for Ralph
 # Implements the Gemini CLI integration (Native Agent Mode)
 
+# Source base provider for shared utilities
+source "$(dirname "${BASH_SOURCE[0]}")/base.sh"
+
 # Provider-specific configuration
 GEMINI_CMD="gemini"
 
@@ -67,24 +70,4 @@ validate_allowed_tools() {
 }
 
 # Helper to build loop context
-build_loop_context() {
-    local loop_count=$1
-    local context="Loop #$loop_count. "
-
-    if [[ -f "$RALPH_DIR/fix_plan.md" ]]; then
-        local incomplete_tasks=$(grep -cE "^[[:space:]]*- \[ \]" "$RALPH_DIR/fix_plan.md" 2>/dev/null || true)
-        context+="Remaining tasks: ${incomplete_tasks:-0}. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.circuit_breaker_state" ]]; then
-        local cb_state=$(jq -r '.state // "UNKNOWN"' "$RALPH_DIR/.circuit_breaker_state" 2>/dev/null)
-        [[ "$cb_state" != "CLOSED" && -n "$cb_state" && "$cb_state" != "null" ]] && context+="Circuit breaker: $cb_state. "
-    fi
-
-    if [[ -f "$RALPH_DIR/.response_analysis" ]]; then
-        local prev_summary=$(jq -r '.analysis.work_summary // ""' "$RALPH_DIR/.response_analysis" 2>/dev/null | head -c 200)
-        [[ -n "$prev_summary" && "$prev_summary" != "null" ]] && context+="Previous: $prev_summary"
-    fi
-
-    echo "${context:0:500}"
-}
+# (Now provided by lib/providers/base.sh)
diff --git a/tests/unit/test_cli_modern.bats b/tests/unit/test_cli_modern.bats
index e5417389..cfeeb0d2 100644
--- a/tests/unit/test_cli_modern.bats
+++ b/tests/unit/test_cli_modern.bats
@@ -701,8 +701,8 @@ EOF
     run grep -c 'stdin must be redirected' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     assert_success
-    # Should appear in both background and live mode sections
-    [[ "$output" == "2" ]]
+    # Should appear in both background (2 branches) and live mode sections
+    [[ "$output" == "3" ]]
 }
 
 # =============================================================================
@@ -785,17 +785,17 @@ EOF
 
 @test "live mode overrides text to json format in lib/providers/claude.sh" {
     # Verify lib/providers/claude.sh contains the live mode format override logic
-    run grep -A3 'LIVE_OUTPUT.*true.*CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
+    run grep -A3 'LIVE_OUTPUT.*true.*output_format.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should find the override block
-    [[ "$output" == *"CLAUDE_OUTPUT_FORMAT"* ]]
+    [[ "$output" == *"output_format"* ]]
     [[ "$output" == *"json"* ]]
 }
 
 @test "live mode format override preserves json format unchanged" {
     # The override should only trigger when format is "text", not "json"
     # Verify the condition checks for text specifically
-    run grep 'CLAUDE_OUTPUT_FORMAT.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
+    run grep 'output_format.*text' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should check specifically for "text" (not a blanket override)
     [[ "$output" == *'text'* ]]
@@ -803,10 +803,10 @@ EOF
 
 @test "safety check prevents live mode with empty CLAUDE_CMD_ARGS" {
     # Verify lib/providers/claude.sh has the safety check for empty CLAUDE_CMD_ARGS
-    run grep -A3 'use_modern_cli.*CLAUDE_CMD_ARGS.*-eq 0' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
+    run grep -A10 'Failed to build modern CLI command' "${BATS_TEST_DIRNAME}/../../lib/providers/claude.sh"
 
     # Should find safety check that falls back to background mode
-    [[ "$output" == *"LIVE_OUTPUT"* ]] || [[ "$output" == *"background"* ]]
+    [[ "$output" == *"LIVE_OUTPUT"* ]]
 }
 
 @test "build_claude_command is called regardless of output format in lib/providers/claude.sh" {

From 2d5be905a9bf53327d08061c12eea1fee22524af Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 19:18:42 +0100
Subject: [PATCH 12/13] fix: explicitly pass loop_count to reset_session for
 accurate session tracking

---
 lib/session_manager.sh |  3 ++-
 ralph_loop.sh          | 12 ++++++------
 2 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/lib/session_manager.sh b/lib/session_manager.sh
index abc900c0..40faf398 100644
--- a/lib/session_manager.sh
+++ b/lib/session_manager.sh
@@ -22,6 +22,7 @@ get_session_id() {
 # Reset session with reason logging
 reset_session() {
     local reason=${1:-"manual_reset"}
+    local explicit_loop_count=${2:-0}
     local reset_timestamp=$(get_iso_timestamp)
 
     jq -n \
@@ -45,7 +46,7 @@ reset_session() {
     fi
     rm -f "$RALPH_DIR/.response_analysis" 2>/dev/null
 
-    log_session_transition "active" "reset" "$reason" "${loop_count:-0}" || true
+    log_session_transition "active" "reset" "$reason" "$explicit_loop_count" || true
     log_status "INFO" "Session reset: $reason"
 }
 
diff --git a/ralph_loop.sh b/ralph_loop.sh
index a4a844d3..d184beb7 100755
--- a/ralph_loop.sh
+++ b/ralph_loop.sh
@@ -599,7 +599,7 @@ main() {
         
         # Check circuit breaker before attempting execution
         if should_halt_execution; then
-            reset_session "circuit_breaker_open"
+            reset_session "circuit_breaker_open" "$loop_count"
             update_status "$loop_count" "$(cat "$CALL_COUNT_FILE")" "circuit_breaker_open" "halted" "stagnation_detected"
             log_status "ERROR" "🛑 Circuit breaker has opened - execution halted"
             break
@@ -617,7 +617,7 @@ main() {
             # Handle permission_denied specially (Issue #101)
             if [[ "$exit_reason" == "permission_denied" ]]; then
                 log_status "ERROR" "🚫 Permission denied - halting loop"
-                reset_session "permission_denied"
+                reset_session "permission_denied" "$loop_count"
                 update_status "$loop_count" "$(cat "$CALL_COUNT_FILE")" "permission_denied" "halted" "permission_denied"
 
                 # Display helpful guidance for resolving permission issues
@@ -654,7 +654,7 @@ main() {
             fi
 
             log_status "SUCCESS" "🏁 Graceful exit triggered: $exit_reason"
-            reset_session "project_complete"
+            reset_session "project_complete" "$loop_count"
             update_status "$loop_count" "$(cat "$CALL_COUNT_FILE")" "graceful_exit" "completed" "$exit_reason"
 
             log_status "SUCCESS" "🎉 Ralph has completed the project! Final stats:"
@@ -680,7 +680,7 @@ main() {
             sleep 5
         elif [ $exec_result -eq 3 ]; then
             # Circuit breaker opened
-            reset_session "circuit_breaker_trip"
+            reset_session "circuit_breaker_trip" "$loop_count"
             update_status "$loop_count" "$(cat "$CALL_COUNT_FILE")" "circuit_breaker_open" "halted" "stagnation_detected"
             log_status "ERROR" "🛑 Circuit breaker has opened - halting loop"
             log_status "INFO" "Run 'ralph --reset-circuit' to reset the circuit breaker after addressing issues"
@@ -845,14 +845,14 @@ while [[ $# -gt 0 ]]; do
             source "$SCRIPT_DIR/lib/circuit_breaker.sh"
             source "$SCRIPT_DIR/lib/date_utils.sh"
             reset_circuit_breaker "Manual reset via command line"
-            reset_session "manual_circuit_reset"
+            reset_session "manual_circuit_reset" 0
             exit 0
             ;;
         --reset-session)
             # Reset session state only
             SCRIPT_DIR="$(dirname "${BASH_SOURCE[0]}")"
             source "$SCRIPT_DIR/lib/date_utils.sh"
-            reset_session "manual_reset_flag"
+            reset_session "manual_reset_flag" 0
             echo -e "\033[0;32m✅ Session state reset successfully\033[0m"
             exit 0
             ;;

From ebcce88d4784685799626e549c01aa7f82c36bb2 Mon Sep 17 00:00:00 2001
From: Markus Waldheim <markus@waldheim.dev>
Date: Tue, 10 Feb 2026 20:08:30 +0100
Subject: [PATCH 13/13] fix: improve provider robustness and session logging
 safety

- Validate prompt file existence in copilot.sh
- Implement exit code 2 for API limits in gemini.sh
- Validate loop_number as integer in log_session_transition
---
 lib/providers/copilot.sh | 7 +++++++
 lib/providers/gemini.sh  | 6 ++++++
 lib/session_manager.sh   | 6 ++++++
 3 files changed, 19 insertions(+)

diff --git a/lib/providers/copilot.sh b/lib/providers/copilot.sh
index 5663b64e..29ac4271 100644
--- a/lib/providers/copilot.sh
+++ b/lib/providers/copilot.sh
@@ -36,6 +36,11 @@ provider_execute() {
     
     # Build loop context
     local loop_context=$(build_loop_context "$loop_count")
+    
+    if [[ ! -r "$prompt_file" ]]; then
+        log_status "ERROR" "Prompt file not found or unreadable: $prompt_file"
+        return 1
+    fi
     local prompt_content=$(cat "$prompt_file")
     local full_prompt="$loop_context
 
@@ -70,6 +75,8 @@ $prompt_content"
         return 0
     else
         log_status "ERROR" "Copilot execution failed."
+        # TODO: Detect specific API limit errors if Copilot exposes them in stdout/stderr
+        # If grep -q "rate limit" "$output_file"; then return 2; fi
         return 1
     fi
 }
diff --git a/lib/providers/gemini.sh b/lib/providers/gemini.sh
index 581dfa7a..dcdfb5a0 100644
--- a/lib/providers/gemini.sh
+++ b/lib/providers/gemini.sh
@@ -59,6 +59,12 @@ provider_execute() {
         update_exit_signals
         return 0
     else
+        # Check for specific error conditions in output file
+        if grep -qi "429\|quota\|limit" "$output_file"; then
+            log_status "ERROR" "Gemini API rate limit reached."
+            return 2
+        fi
+        
         log_status "ERROR" "Gemini execution failed."
         return 1
     fi
diff --git a/lib/session_manager.sh b/lib/session_manager.sh
index 40faf398..2799f454 100644
--- a/lib/session_manager.sh
+++ b/lib/session_manager.sh
@@ -56,6 +56,12 @@ log_session_transition() {
     local to_state=$2
     local reason=$3
     local loop_number=${4:-0}
+    
+    # Ensure loop_number is a valid integer
+    if [[ ! "$loop_number" =~ ^[0-9]+$ ]]; then
+        loop_number=0
+    fi
+    
     local ts=$(get_iso_timestamp)
 
     local transition=$(jq -n -c \