Refactor LLM service architecture and improve document processing

- Refactor LLM service with provider pattern (Anthropic, OpenAI, OpenRouter)
- Add structured LLM prompts and utilities (token estimation, cost calculation, JSON extraction)
- Implement RAG improvements with optimized chunking and embedding services
- Add financial extraction monitoring service
- Add parallel document processor
- Improve error handling with dedicated error handlers
- Add comprehensive TypeScript types for LLM, document, and processing
- Update optimized agentic RAG processor and simple document processor
This commit is contained in:
admin
2025-11-11 21:04:42 -05:00
parent ecd4b13115
commit 87c6da4225
38 changed files with 6232 additions and 1181 deletions

View File

@@ -38,10 +38,12 @@
### Documentation
- `APP_DESIGN_DOCUMENTATION.md` - Complete system architecture
- `AGENTIC_RAG_IMPLEMENTATION_PLAN.md` - AI processing strategy
- `PDF_GENERATION_ANALYSIS.md` - PDF generation optimization
- `DEPLOYMENT_GUIDE.md` - Deployment instructions
- `ARCHITECTURE_DIAGRAMS.md` - Visual architecture documentation
- `QUICK_START.md` - Quick start guide
- `TESTING_STRATEGY_DOCUMENTATION.md` - Testing guidelines
- `TROUBLESHOOTING_GUIDE.md` - Troubleshooting guide
### Configuration
- `backend/src/config/` - Environment and service configuration
@@ -94,9 +96,9 @@ cd frontend && npm run dev
- **uploadMonitoringService.ts** - Real-time upload tracking
### 3. Data Management
- **agenticRAGDatabaseService.ts** - Analytics and session management
- **vectorDatabaseService.ts** - Vector embeddings and search
- **sessionService.ts** - User session management
- **jobQueueService.ts** - Background job processing
- **jobProcessorService.ts** - Job execution logic
## 📊 Processing Strategies
@@ -188,7 +190,7 @@ Structured CIM Review data including:
## 🧪 Testing
### Test Structure
- **Unit Tests**: Jest for backend, Vitest for frontend
- **Unit Tests**: Vitest for backend and frontend
- **Integration Tests**: End-to-end testing
- **API Tests**: Supertest for backend endpoints
@@ -203,15 +205,12 @@ Structured CIM Review data including:
### Technical Documentation
- [Application Design Documentation](APP_DESIGN_DOCUMENTATION.md) - Complete system architecture
- [Agentic RAG Implementation Plan](AGENTIC_RAG_IMPLEMENTATION_PLAN.md) - AI processing strategy
- [PDF Generation Analysis](PDF_GENERATION_ANALYSIS.md) - PDF optimization details
- [Architecture Diagrams](ARCHITECTURE_DIAGRAMS.md) - Visual system design
- [Deployment Guide](DEPLOYMENT_GUIDE.md) - Deployment instructions
### Analysis Reports
- [Codebase Audit Report](codebase-audit-report.md) - Code quality analysis
- [Dependency Analysis Report](DEPENDENCY_ANALYSIS_REPORT.md) - Dependency management
- [Document AI Integration Summary](DOCUMENT_AI_INTEGRATION_SUMMARY.md) - Google Document AI setup
- [Quick Start Guide](QUICK_START.md) - Getting started
- [Testing Strategy](TESTING_STRATEGY_DOCUMENTATION.md) - Testing guidelines
- [Troubleshooting Guide](TROUBLESHOOTING_GUIDE.md) - Common issues and solutions
## 🤝 Contributing

View File

@@ -0,0 +1,169 @@
/**
* Application-wide constants
* Centralized location for model configurations, cost rates, timeouts, and other constants
*/
/**
 * LLM Model Cost Rates (USD per 1M tokens)
 * Used for cost estimation in LLM service.
 * Keys are exact model identifiers as sent to the provider APIs; each entry
 * prices input and output tokens separately.
 */
export const LLM_COST_RATES: Record<string, { input: number; output: number }> = {
  'claude-3-opus-20240229': { input: 15, output: 75 },
  'claude-sonnet-4-5-20250929': { input: 3, output: 15 }, // Sonnet 4.5
  'claude-3-5-sonnet-20241022': { input: 3, output: 15 },
  'claude-haiku-4-5-20251015': { input: 0.25, output: 1.25 }, // Haiku 4.5 (released Oct 15, 2025)
  'claude-3-5-haiku-20241022': { input: 0.25, output: 1.25 },
  'claude-3-5-haiku-latest': { input: 0.25, output: 1.25 },
  'gpt-4o': { input: 5, output: 15 },
  'gpt-4o-mini': { input: 0.15, output: 0.60 },
};

/**
 * Default cost rate fallback (used when a model is not found in LLM_COST_RATES).
 * Aliases the Claude 3.5 Sonnet entry above, so estimates for unknown models
 * assume mid-tier pricing rather than zero.
 */
export const DEFAULT_COST_RATE = LLM_COST_RATES['claude-3-5-sonnet-20241022'];
/**
 * OpenRouter Model Name Mappings
 * Maps Anthropic model names to OpenRouter API format (`anthropic/...`).
 */
export const OPENROUTER_MODEL_MAPPINGS: Record<string, string> = {
  // Claude 4.x models
  'claude-sonnet-4-5-20250929': 'anthropic/claude-sonnet-4.5',
  'claude-sonnet-4': 'anthropic/claude-sonnet-4.5',
  'claude-haiku-4-5-20251015': 'anthropic/claude-haiku-4.5',
  'claude-haiku-4': 'anthropic/claude-haiku-4.5',
  'claude-opus-4': 'anthropic/claude-opus-4',
  // Claude 3.7 models
  'claude-3-7-sonnet-latest': 'anthropic/claude-3.7-sonnet',
  'claude-3-7-sonnet': 'anthropic/claude-3.7-sonnet',
  // Claude 3.5 models
  'claude-3-5-sonnet-20241022': 'anthropic/claude-3.5-sonnet',
  'claude-3-5-sonnet': 'anthropic/claude-3.5-sonnet',
  'claude-3-5-haiku-20241022': 'anthropic/claude-3.5-haiku',
  'claude-3-5-haiku-latest': 'anthropic/claude-3.5-haiku',
  'claude-3-5-haiku': 'anthropic/claude-3.5-haiku',
  // Claude 3.0 models
  'claude-3-haiku': 'anthropic/claude-3-haiku',
  'claude-3-opus': 'anthropic/claude-3-opus',
};

/**
 * Map an Anthropic model name to OpenRouter format.
 * Handles versioned and generic model names.
 *
 * BUG FIX over the original heuristic matching:
 * - The release-date suffix (e.g. "-20240620") is stripped before version
 *   checks; previously the digit '4' inside a date made 3.x models match the
 *   Claude 4 branches (e.g. "claude-3-5-sonnet-20240620" → sonnet-4.5).
 * - Generation checks run most-specific first, so the 3.7/3.5 branches are no
 *   longer shadowed by the generic '4' check (the old `sonnet && '4.5'` branch
 *   was unreachable).
 * - Both hyphenated ("3-5") and dotted ("3.5") version tokens are recognized.
 *
 * @param model Anthropic-style model identifier.
 * @returns OpenRouter model slug, or the input unchanged for non-Claude models.
 */
export function mapModelToOpenRouter(model: string): string {
  // Exact mapping wins over heuristics.
  if (OPENROUTER_MODEL_MAPPINGS[model]) {
    return OPENROUTER_MODEL_MAPPINGS[model];
  }

  if (model.includes('claude')) {
    // Strip a trailing release-date suffix so its digits cannot be mistaken
    // for a generation number.
    const base = model.replace(/-\d{8}$/, '');
    const hasVersion = (...tokens: string[]): boolean =>
      tokens.some(token => base.includes(token));

    if (base.includes('sonnet')) {
      if (hasVersion('3-7', '3.7')) return 'anthropic/claude-3.7-sonnet';
      if (hasVersion('3-5', '3.5')) return 'anthropic/claude-3.5-sonnet';
      if (hasVersion('4')) return 'anthropic/claude-sonnet-4.5';
    } else if (base.includes('haiku')) {
      if (hasVersion('3-5', '3.5')) return 'anthropic/claude-3.5-haiku';
      if (hasVersion('4')) return 'anthropic/claude-haiku-4.5';
      if (hasVersion('3')) return 'anthropic/claude-3-haiku';
    } else if (base.includes('opus')) {
      if (hasVersion('4')) return 'anthropic/claude-opus-4';
      if (hasVersion('3')) return 'anthropic/claude-3-opus';
    }

    // Fallback: try to construct from model name
    return `anthropic/${model}`;
  }

  // Return non-Claude models as-is if no mapping found
  return model;
}
/**
 * LLM Timeout Constants (in milliseconds)
 */
export const LLM_TIMEOUTS = {
  DEFAULT: 180000, // 3 minutes
  COMPLEX_ANALYSIS: 360000, // 6 minutes for complex CIM analysis
  OPENROUTER_DEFAULT: 360000, // 6 minutes for OpenRouter
  ABORT_BUFFER: 10000, // 10 seconds buffer before wrapper timeout
  SDK_BUFFER: 10000, // 10 seconds buffer for SDK timeout
} as const;

/**
 * Token Estimation Constants
 * Shared by the cost and token-count helpers below.
 */
export const TOKEN_ESTIMATION = {
  CHARS_PER_TOKEN: 4, // Rough estimation: 1 token ≈ 4 characters for English text
  INPUT_OUTPUT_RATIO: 0.8, // Assume 80% input, 20% output for cost estimation
} as const;

/**
 * Default LLM Configuration Values
 * NOTE(review): semantics assumed from names (e.g. MAX_INPUT_TOKENS presumably
 * caps prompt size against the model context window) — confirm in llmService.
 */
export const LLM_DEFAULTS = {
  MAX_TOKENS: 16000,
  TEMPERATURE: 0.1, // low temperature: extraction should be near-deterministic
  PROMPT_BUFFER: 500,
  MAX_INPUT_TOKENS: 200000,
  DEFAULT_MAX_TOKENS_SIMPLE: 3000,
  DEFAULT_TEMPERATURE_SIMPLE: 0.3,
} as const;

/**
 * OpenRouter API Configuration
 * HTTP_REFERER / X_TITLE are the attribution headers OpenRouter expects.
 */
export const OPENROUTER_CONFIG = {
  BASE_URL: 'https://openrouter.ai/api/v1/chat/completions',
  HTTP_REFERER: 'https://cim-summarizer-testing.firebaseapp.com',
  X_TITLE: 'CIM Summarizer',
} as const;

/**
 * Retry Configuration
 * NOTE(review): exponential backoff (delay × BACKOFF_MULTIPLIER per attempt,
 * capped at MAX_DELAY_MS) is inferred from the names — verify against the
 * retry helper that consumes these values.
 */
export const RETRY_CONFIG = {
  MAX_ATTEMPTS: 3,
  INITIAL_DELAY_MS: 1000, // 1 second
  MAX_DELAY_MS: 10000, // 10 seconds
  BACKOFF_MULTIPLIER: 2,
} as const;
/**
 * Estimate the USD cost of an LLM call from a total token count.
 *
 * Splits tokens into input/output portions using
 * TOKEN_ESTIMATION.INPUT_OUTPUT_RATIO and prices each side with the model's
 * per-1M-token rates, falling back to DEFAULT_COST_RATE for unknown models.
 *
 * @param tokens Total token count (input + output combined).
 * @param model  Model identifier used to look up pricing.
 * @returns Estimated cost in USD (0 if no rate is available at all).
 */
export function estimateLLMCost(tokens: number, model: string): number {
  const rates = LLM_COST_RATES[model] ?? DEFAULT_COST_RATE;
  if (!rates) {
    return 0;
  }
  const ratio = TOKEN_ESTIMATION.INPUT_OUTPUT_RATIO;
  const inputCost = (tokens * ratio * rates.input) / 1000000;
  const outputCost = (tokens * (1 - ratio) * rates.output) / 1000000;
  return inputCost + outputCost;
}

/**
 * Rough token-count estimate for a piece of text.
 * Character-count heuristic only; not a real tokenizer.
 */
export function estimateTokenCount(text: string): number {
  const { CHARS_PER_TOKEN } = TOKEN_ESTIMATION;
  return Math.ceil(text.length / CHARS_PER_TOKEN);
}

View File

@@ -0,0 +1,232 @@
-- Migration: Add financial extraction monitoring tables
-- Created: 2025-11-11
-- Description: Track financial extraction accuracy, errors, and API call patterns
-- Table to track financial extraction events (one row per extraction attempt)
CREATE TABLE IF NOT EXISTS financial_extraction_events (
    id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
    document_id UUID REFERENCES documents(id) ON DELETE CASCADE,
    job_id UUID REFERENCES processing_jobs(id) ON DELETE SET NULL,
    user_id UUID REFERENCES users(id) ON DELETE SET NULL,

    -- Extraction details
    extraction_method TEXT NOT NULL, -- 'deterministic_parser', 'llm_haiku', 'llm_sonnet', 'fallback'
    model_used TEXT, -- e.g., 'claude-3-5-haiku-latest', 'claude-sonnet-4-5-20250514'
    attempt_number INTEGER DEFAULT 1,

    -- Results
    success BOOLEAN NOT NULL,
    has_financials BOOLEAN DEFAULT FALSE,
    periods_extracted TEXT[], -- Array of periods found: ['fy3', 'fy2', 'fy1', 'ltm']
    metrics_extracted TEXT[], -- Array of metrics: ['revenue', 'ebitda', 'ebitdaMargin', etc.]

    -- Validation results
    validation_passed BOOLEAN,
    validation_issues TEXT[], -- Array of validation warnings/errors
    auto_corrections_applied INTEGER DEFAULT 0, -- Number of auto-corrections (e.g., margin fixes)

    -- API call tracking
    api_call_duration_ms INTEGER,
    tokens_used INTEGER,
    cost_estimate_usd DECIMAL(10, 6),
    rate_limit_hit BOOLEAN DEFAULT FALSE,

    -- Error tracking
    error_type TEXT, -- 'rate_limit', 'validation_failure', 'api_error', 'timeout', etc.
    error_message TEXT,
    error_code TEXT,

    -- Timing
    processing_time_ms INTEGER,
    created_at TIMESTAMP WITH TIME ZONE DEFAULT NOW()
);

-- Indexes for common queries.
-- BUG FIX: the original declared these as inline INDEX clauses inside
-- CREATE TABLE, which is not valid PostgreSQL syntax and would make the
-- migration fail to apply. Indexes must be standalone statements.
CREATE INDEX IF NOT EXISTS idx_financial_extraction_events_document_id ON financial_extraction_events(document_id);
CREATE INDEX IF NOT EXISTS idx_financial_extraction_events_created_at ON financial_extraction_events(created_at DESC);
CREATE INDEX IF NOT EXISTS idx_financial_extraction_events_success ON financial_extraction_events(success);
CREATE INDEX IF NOT EXISTS idx_financial_extraction_events_method ON financial_extraction_events(extraction_method);
-- Table to track API call patterns (for rate limit prevention)
CREATE TABLE IF NOT EXISTS api_call_tracking (
    id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
    provider TEXT NOT NULL, -- 'anthropic', 'openai', 'openrouter'
    model TEXT NOT NULL,
    endpoint TEXT NOT NULL, -- 'financial_extraction', 'full_extraction', etc.

    -- Call details
    timestamp TIMESTAMP WITH TIME ZONE DEFAULT NOW(),
    duration_ms INTEGER,
    success BOOLEAN NOT NULL,
    rate_limit_hit BOOLEAN DEFAULT FALSE,
    retry_attempt INTEGER DEFAULT 0,

    -- Token usage
    input_tokens INTEGER,
    output_tokens INTEGER,
    total_tokens INTEGER,

    -- Cost tracking
    cost_usd DECIMAL(10, 6),

    -- Error details (if failed)
    error_type TEXT,
    error_message TEXT
);

-- Indexes for rate limit tracking.
-- BUG FIX: inline INDEX clauses are not valid PostgreSQL CREATE TABLE syntax;
-- they must be standalone CREATE INDEX statements.
CREATE INDEX IF NOT EXISTS idx_api_call_tracking_provider_model ON api_call_tracking(provider, model);
CREATE INDEX IF NOT EXISTS idx_api_call_tracking_timestamp ON api_call_tracking(timestamp DESC);
CREATE INDEX IF NOT EXISTS idx_api_call_tracking_rate_limit ON api_call_tracking(rate_limit_hit, timestamp DESC);
-- Table for aggregated metrics (updated periodically, one row per day)
CREATE TABLE IF NOT EXISTS financial_extraction_metrics (
    id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
    metric_date DATE NOT NULL UNIQUE, -- upsert target for update_financial_extraction_metrics()

    -- Success metrics
    total_extractions INTEGER DEFAULT 0,
    successful_extractions INTEGER DEFAULT 0,
    failed_extractions INTEGER DEFAULT 0,
    success_rate DECIMAL(5, 4), -- 0.0000 to 1.0000

    -- Method breakdown
    deterministic_parser_count INTEGER DEFAULT 0,
    llm_haiku_count INTEGER DEFAULT 0,
    llm_sonnet_count INTEGER DEFAULT 0,
    fallback_count INTEGER DEFAULT 0,

    -- Accuracy metrics
    avg_periods_extracted DECIMAL(3, 2), -- Average number of periods extracted
    avg_metrics_extracted DECIMAL(5, 2), -- Average number of metrics extracted
    validation_pass_rate DECIMAL(5, 4),
    avg_auto_corrections DECIMAL(5, 2),

    -- Performance metrics
    avg_processing_time_ms INTEGER,
    avg_api_call_duration_ms INTEGER,
    p95_processing_time_ms INTEGER,
    p99_processing_time_ms INTEGER,

    -- Cost metrics
    total_cost_usd DECIMAL(10, 2),
    avg_cost_per_extraction_usd DECIMAL(10, 6),

    -- Error metrics
    rate_limit_errors INTEGER DEFAULT 0,
    validation_errors INTEGER DEFAULT 0,
    api_errors INTEGER DEFAULT 0,
    timeout_errors INTEGER DEFAULT 0,

    -- Updated timestamp
    updated_at TIMESTAMP WITH TIME ZONE DEFAULT NOW()
);

-- BUG FIX: the inline INDEX clause is not valid PostgreSQL CREATE TABLE
-- syntax; the index must be created as a standalone statement.
CREATE INDEX IF NOT EXISTS idx_financial_extraction_metrics_date ON financial_extraction_metrics(metric_date DESC);
-- Function to update daily metrics (can be called by a scheduled job).
-- Aggregates every financial_extraction_events row whose created_at falls on
-- target_date into a single financial_extraction_metrics row, upserting on the
-- UNIQUE metric_date column. Defaults to the current date when called with no
-- argument, so re-running it is idempotent for a given day.
CREATE OR REPLACE FUNCTION update_financial_extraction_metrics(target_date DATE DEFAULT CURRENT_DATE)
RETURNS VOID AS $$
DECLARE
    v_total INTEGER;
    v_successful INTEGER;
    v_failed INTEGER;
    v_success_rate DECIMAL(5, 4);
    v_deterministic INTEGER;
    v_haiku INTEGER;
    v_sonnet INTEGER;
    v_fallback INTEGER;
    v_avg_periods DECIMAL(3, 2);
    v_avg_metrics DECIMAL(5, 2);
    v_validation_pass_rate DECIMAL(5, 4);
    v_avg_auto_corrections DECIMAL(5, 2);
    v_avg_processing_time INTEGER;
    v_avg_api_duration INTEGER;
    v_p95_processing INTEGER;
    v_p99_processing INTEGER;
    v_total_cost DECIMAL(10, 2);
    v_avg_cost DECIMAL(10, 6);
    v_rate_limit_errors INTEGER;
    v_validation_errors INTEGER;
    v_api_errors INTEGER;
    v_timeout_errors INTEGER;
BEGIN
    -- Calculate all metrics for the target date in a single table scan:
    -- FILTER clauses partition the counts by outcome/method/error type, and
    -- AVG/SUM/PERCENTILE_CONT are COALESCEd so a day with no events yields
    -- zeros rather than NULLs.
    SELECT
        COUNT(*),
        COUNT(*) FILTER (WHERE success = true),
        COUNT(*) FILTER (WHERE success = false),
        CASE WHEN COUNT(*) > 0 THEN COUNT(*) FILTER (WHERE success = true)::DECIMAL / COUNT(*) ELSE 0 END,
        COUNT(*) FILTER (WHERE extraction_method = 'deterministic_parser'),
        COUNT(*) FILTER (WHERE extraction_method = 'llm_haiku'),
        COUNT(*) FILTER (WHERE extraction_method = 'llm_sonnet'),
        COUNT(*) FILTER (WHERE extraction_method = 'fallback'),
        COALESCE(AVG(array_length(periods_extracted, 1)), 0),
        COALESCE(AVG(array_length(metrics_extracted, 1)), 0),
        CASE WHEN COUNT(*) > 0 THEN COUNT(*) FILTER (WHERE validation_passed = true)::DECIMAL / COUNT(*) ELSE 0 END,
        COALESCE(AVG(auto_corrections_applied), 0),
        COALESCE(AVG(processing_time_ms), 0)::INTEGER,
        COALESCE(AVG(api_call_duration_ms), 0)::INTEGER,
        COALESCE(PERCENTILE_CONT(0.95) WITHIN GROUP (ORDER BY processing_time_ms), 0)::INTEGER,
        COALESCE(PERCENTILE_CONT(0.99) WITHIN GROUP (ORDER BY processing_time_ms), 0)::INTEGER,
        COALESCE(SUM(cost_estimate_usd), 0),
        CASE WHEN COUNT(*) > 0 THEN COALESCE(SUM(cost_estimate_usd), 0) / COUNT(*) ELSE 0 END,
        COUNT(*) FILTER (WHERE error_type = 'rate_limit'),
        COUNT(*) FILTER (WHERE error_type = 'validation_failure'),
        COUNT(*) FILTER (WHERE error_type = 'api_error'),
        COUNT(*) FILTER (WHERE error_type = 'timeout')
    INTO
        v_total, v_successful, v_failed, v_success_rate,
        v_deterministic, v_haiku, v_sonnet, v_fallback,
        v_avg_periods, v_avg_metrics, v_validation_pass_rate, v_avg_auto_corrections,
        v_avg_processing_time, v_avg_api_duration, v_p95_processing, v_p99_processing,
        v_total_cost, v_avg_cost,
        v_rate_limit_errors, v_validation_errors, v_api_errors, v_timeout_errors
    FROM financial_extraction_events
    WHERE DATE(created_at) = target_date;

    -- Insert or update the daily row (upsert keyed on UNIQUE metric_date).
    INSERT INTO financial_extraction_metrics (
        metric_date, total_extractions, successful_extractions, failed_extractions,
        success_rate, deterministic_parser_count, llm_haiku_count, llm_sonnet_count,
        fallback_count, avg_periods_extracted, avg_metrics_extracted,
        validation_pass_rate, avg_auto_corrections, avg_processing_time_ms,
        avg_api_call_duration_ms, p95_processing_time_ms, p99_processing_time_ms,
        total_cost_usd, avg_cost_per_extraction_usd, rate_limit_errors,
        validation_errors, api_errors, timeout_errors, updated_at
    ) VALUES (
        target_date, v_total, v_successful, v_failed, v_success_rate,
        v_deterministic, v_haiku, v_sonnet, v_fallback,
        v_avg_periods, v_avg_metrics, v_validation_pass_rate, v_avg_auto_corrections,
        v_avg_processing_time, v_avg_api_duration, v_p95_processing, v_p99_processing,
        v_total_cost, v_avg_cost,
        v_rate_limit_errors, v_validation_errors, v_api_errors, v_timeout_errors,
        NOW()
    )
    ON CONFLICT (metric_date) DO UPDATE SET
        total_extractions = EXCLUDED.total_extractions,
        successful_extractions = EXCLUDED.successful_extractions,
        failed_extractions = EXCLUDED.failed_extractions,
        success_rate = EXCLUDED.success_rate,
        deterministic_parser_count = EXCLUDED.deterministic_parser_count,
        llm_haiku_count = EXCLUDED.llm_haiku_count,
        llm_sonnet_count = EXCLUDED.llm_sonnet_count,
        fallback_count = EXCLUDED.fallback_count,
        avg_periods_extracted = EXCLUDED.avg_periods_extracted,
        avg_metrics_extracted = EXCLUDED.avg_metrics_extracted,
        validation_pass_rate = EXCLUDED.validation_pass_rate,
        avg_auto_corrections = EXCLUDED.avg_auto_corrections,
        avg_processing_time_ms = EXCLUDED.avg_processing_time_ms,
        avg_api_call_duration_ms = EXCLUDED.avg_api_call_duration_ms,
        p95_processing_time_ms = EXCLUDED.p95_processing_time_ms,
        p99_processing_time_ms = EXCLUDED.p99_processing_time_ms,
        total_cost_usd = EXCLUDED.total_cost_usd,
        avg_cost_per_extraction_usd = EXCLUDED.avg_cost_per_extraction_usd,
        rate_limit_errors = EXCLUDED.rate_limit_errors,
        validation_errors = EXCLUDED.validation_errors,
        api_errors = EXCLUDED.api_errors,
        timeout_errors = EXCLUDED.timeout_errors,
        updated_at = NOW();
END;
$$ LANGUAGE plpgsql;

View File

@@ -0,0 +1,364 @@
#!/usr/bin/env ts-node
/**
* Comparison Test: Parallel Processing vs Sequential Processing
*
* This script tests the new parallel processing methodology against
* the current production (sequential) methodology to measure:
* - Processing time differences
* - API call counts
* - Accuracy/completeness
* - Rate limit safety
*/
import * as dotenv from 'dotenv';
import * as path from 'path';
import * as fs from 'fs';
import { simpleDocumentProcessor } from '../services/simpleDocumentProcessor';
import { parallelDocumentProcessor } from '../services/parallelDocumentProcessor';
import { documentAiProcessor } from '../services/documentAiProcessor';
import { logger } from '../utils/logger';
// Load environment variables
dotenv.config({ path: path.join(__dirname, '../../.env') });
// Result of running one processing method (sequential or parallel) on a document.
interface ComparisonResult {
  method: 'sequential' | 'parallel';
  success: boolean;
  processingTime: number; // wall-clock milliseconds for the processing call
  apiCalls: number;
  completeness: number; // 0-100 score from calculateCompleteness()
  sectionsExtracted: string[];
  error?: string;
  financialData?: any; // financialSummary section, kept for cross-method comparison
}

// Side-by-side results for one document, plus derived improvement metrics.
interface TestResults {
  documentId: string;
  fileName: string;
  sequential: ComparisonResult;
  parallel: ComparisonResult;
  improvement: {
    timeReduction: number; // percentage
    timeSaved: number; // milliseconds
    apiCallsDifference: number;
    completenessDifference: number;
  };
}
/**
 * Calculate a completeness score (0-100) for a CIMReview-like object.
 *
 * Walks the object tree counting leaf fields and how many of them hold a
 * meaningful value (not empty, not 'N/A', not 'Not specified in CIM').
 *
 * BUG FIX: the original tested `!Array.isArray(obj)` (always true at that
 * point) instead of `!Array.isArray(value)`, so array values were recursed
 * into and then silently dropped from the count. Arrays now count as leaf
 * fields (filled when non-empty), and null/undefined values count as
 * unfilled leaves instead of being skipped entirely.
 *
 * @param data Analysis result object (any shape); falsy input scores 0.
 * @returns Percentage of leaf fields that are filled.
 */
function calculateCompleteness(data: any): number {
  if (!data) return 0;
  let totalFields = 0;
  let filledFields = 0;
  const countFields = (obj: any, prefix = '') => {
    if (obj === null || obj === undefined) return;
    if (typeof obj === 'object' && !Array.isArray(obj)) {
      Object.keys(obj).forEach(key => {
        const value = obj[key];
        const fieldPath = prefix ? `${prefix}.${key}` : key;
        if (value !== null && typeof value === 'object' && !Array.isArray(value)) {
          // Plain nested object: recurse.
          countFields(value, fieldPath);
        } else {
          // Leaf field: string/number/boolean/null or an array.
          totalFields++;
          const isFilled = Array.isArray(value)
            ? value.length > 0
            : Boolean(value) && value !== 'Not specified in CIM' && value !== 'N/A' && value !== '';
          if (isFilled) {
            filledFields++;
          }
        }
      });
    }
  };
  countFields(data);
  return totalFields > 0 ? (filledFields / totalFields) * 100 : 0;
}
/**
 * List which top-level CIMReview sections are present on an analysis result.
 * Returns section names in a fixed canonical order; missing or falsy sections
 * are omitted.
 */
function getSectionsExtracted(data: any): string[] {
  const sectionKeys = [
    'dealOverview',
    'businessDescription',
    'marketIndustryAnalysis',
    'financialSummary',
    'managementTeamOverview',
    'preliminaryInvestmentThesis',
  ];
  return sectionKeys.filter(key => Boolean(data?.[key]));
}
/**
 * Test a single document with both methods.
 *
 * Extracts text once via Document AI so both processors see identical input,
 * then runs the sequential (current production) processor and the parallel
 * processor with distinct document-id suffixes and a cool-down pause in
 * between, and finally computes relative improvement metrics.
 *
 * A failure in either processor is recorded in the result rather than thrown,
 * so the other method still runs; only text extraction failure throws.
 */
async function testDocument(
  documentId: string,
  userId: string,
  filePath: string
): Promise<TestResults> {
  console.log('\n' + '='.repeat(80));
  console.log(`Testing Document: ${path.basename(filePath)}`);
  console.log('='.repeat(80));

  // Read file
  const fileBuffer = fs.readFileSync(filePath);
  const fileName = path.basename(filePath);
  const mimeType = 'application/pdf';

  // Extract text once (shared between both methods) so the comparison
  // isolates the processing strategy, not OCR variance.
  console.log('\n📄 Extracting text with Document AI...');
  const extractionResult = await documentAiProcessor.extractTextOnly(
    documentId,
    userId,
    fileBuffer,
    fileName,
    mimeType
  );
  if (!extractionResult || !extractionResult.text) {
    throw new Error('Failed to extract text from document');
  }
  const extractedText = extractionResult.text;
  console.log(`✅ Text extracted: ${extractedText.length} characters`);

  const results: TestResults = {
    documentId,
    fileName,
    // Placeholders; overwritten by the try/catch blocks below.
    sequential: {} as ComparisonResult,
    parallel: {} as ComparisonResult,
    improvement: {
      timeReduction: 0,
      timeSaved: 0,
      apiCallsDifference: 0,
      completenessDifference: 0,
    },
  };

  // Test Sequential Method (Current Production)
  console.log('\n' + '-'.repeat(80));
  console.log('🔄 Testing SEQUENTIAL Method (Current Production)');
  console.log('-'.repeat(80));
  try {
    const sequentialStart = Date.now();
    // Distinct id suffix keeps the two runs from colliding in storage.
    const sequentialResult = await simpleDocumentProcessor.processDocument(
      documentId + '_sequential',
      userId,
      extractedText,
      { fileBuffer, fileName, mimeType }
    );
    const sequentialTime = Date.now() - sequentialStart;
    results.sequential = {
      method: 'sequential',
      success: sequentialResult.success,
      processingTime: sequentialTime,
      apiCalls: sequentialResult.apiCalls,
      completeness: calculateCompleteness(sequentialResult.analysisData),
      sectionsExtracted: getSectionsExtracted(sequentialResult.analysisData),
      error: sequentialResult.error,
      financialData: sequentialResult.analysisData?.financialSummary,
    };
    console.log(`✅ Sequential completed in ${(sequentialTime / 1000).toFixed(2)}s`);
    console.log(` API Calls: ${sequentialResult.apiCalls}`);
    console.log(` Completeness: ${results.sequential.completeness.toFixed(1)}%`);
    console.log(` Sections: ${results.sequential.sectionsExtracted.join(', ')}`);
  } catch (error) {
    // Record the failure; do not rethrow so the parallel run still happens.
    results.sequential = {
      method: 'sequential',
      success: false,
      processingTime: 0,
      apiCalls: 0,
      completeness: 0,
      sectionsExtracted: [],
      error: error instanceof Error ? error.message : String(error),
    };
    console.log(`❌ Sequential failed: ${results.sequential.error}`);
  }

  // Wait a bit between tests to avoid rate limits
  console.log('\n⏳ Waiting 5 seconds before parallel test...');
  await new Promise(resolve => setTimeout(resolve, 5000));

  // Test Parallel Method (New)
  console.log('\n' + '-'.repeat(80));
  console.log('⚡ Testing PARALLEL Method (New)');
  console.log('-'.repeat(80));
  try {
    const parallelStart = Date.now();
    const parallelResult = await parallelDocumentProcessor.processDocument(
      documentId + '_parallel',
      userId,
      extractedText,
      { fileBuffer, fileName, mimeType }
    );
    const parallelTime = Date.now() - parallelStart;
    results.parallel = {
      method: 'parallel',
      success: parallelResult.success,
      processingTime: parallelTime,
      apiCalls: parallelResult.apiCalls,
      completeness: calculateCompleteness(parallelResult.analysisData),
      sectionsExtracted: getSectionsExtracted(parallelResult.analysisData),
      error: parallelResult.error,
      financialData: parallelResult.analysisData?.financialSummary,
    };
    console.log(`✅ Parallel completed in ${(parallelTime / 1000).toFixed(2)}s`);
    console.log(` API Calls: ${parallelResult.apiCalls}`);
    console.log(` Completeness: ${results.parallel.completeness.toFixed(1)}%`);
    console.log(` Sections: ${results.parallel.sectionsExtracted.join(', ')}`);
  } catch (error) {
    results.parallel = {
      method: 'parallel',
      success: false,
      processingTime: 0,
      apiCalls: 0,
      completeness: 0,
      sectionsExtracted: [],
      error: error instanceof Error ? error.message : String(error),
    };
    console.log(`❌ Parallel failed: ${results.parallel.error}`);
  }

  // Calculate improvements (only meaningful when both runs succeeded;
  // otherwise the zeroed placeholders remain).
  if (results.sequential.success && results.parallel.success) {
    results.improvement.timeSaved = results.sequential.processingTime - results.parallel.processingTime;
    results.improvement.timeReduction = results.sequential.processingTime > 0
      ? (results.improvement.timeSaved / results.sequential.processingTime) * 100
      : 0;
    results.improvement.apiCallsDifference = results.parallel.apiCalls - results.sequential.apiCalls;
    results.improvement.completenessDifference = results.parallel.completeness - results.sequential.completeness;
  }

  return results;
}
/**
 * Print a human-readable comparison of the two runs to stdout.
 * Covers timing, API call counts, completeness, sections extracted, and —
 * when both runs produced financial data — a period-by-period revenue
 * cross-check, followed by a one-line verdict.
 */
function printComparisonResults(results: TestResults): void {
  console.log('\n' + '='.repeat(80));
  console.log('📊 COMPARISON RESULTS');
  console.log('='.repeat(80));

  console.log('\n📈 Performance Metrics:');
  console.log(` Sequential Time: ${(results.sequential.processingTime / 1000).toFixed(2)}s`);
  console.log(` Parallel Time: ${(results.parallel.processingTime / 1000).toFixed(2)}s`);
  if (results.improvement.timeSaved > 0) {
    console.log(` ⚡ Time Saved: ${(results.improvement.timeSaved / 1000).toFixed(2)}s (${results.improvement.timeReduction.toFixed(1)}% faster)`);
  } else {
    console.log(` ⚠️ Time Difference: ${(Math.abs(results.improvement.timeSaved) / 1000).toFixed(2)}s (${Math.abs(results.improvement.timeReduction).toFixed(1)}% ${results.improvement.timeReduction < 0 ? 'slower' : 'faster'})`);
  }

  console.log('\n🔢 API Calls:');
  console.log(` Sequential: ${results.sequential.apiCalls}`);
  console.log(` Parallel: ${results.parallel.apiCalls}`);
  if (results.improvement.apiCallsDifference !== 0) {
    const sign = results.improvement.apiCallsDifference > 0 ? '+' : '';
    console.log(` Difference: ${sign}${results.improvement.apiCallsDifference}`);
  }

  console.log('\n✅ Completeness:');
  console.log(` Sequential: ${results.sequential.completeness.toFixed(1)}%`);
  console.log(` Parallel: ${results.parallel.completeness.toFixed(1)}%`);
  if (results.improvement.completenessDifference !== 0) {
    const sign = results.improvement.completenessDifference > 0 ? '+' : '';
    console.log(` Difference: ${sign}${results.improvement.completenessDifference.toFixed(1)}%`);
  }

  console.log('\n📋 Sections Extracted:');
  console.log(` Sequential: ${results.sequential.sectionsExtracted.join(', ') || 'None'}`);
  console.log(` Parallel: ${results.parallel.sectionsExtracted.join(', ') || 'None'}`);

  // Compare financial data if available: spot-check revenue for each
  // reporting period with strict equality only.
  if (results.sequential.financialData && results.parallel.financialData) {
    console.log('\n💰 Financial Data Comparison:');
    const seqFinancials = results.sequential.financialData.financials;
    const parFinancials = results.parallel.financialData.financials;
    ['fy3', 'fy2', 'fy1', 'ltm'].forEach(period => {
      const seqRev = seqFinancials?.[period]?.revenue;
      const parRev = parFinancials?.[period]?.revenue;
      const match = seqRev === parRev ? '✅' : '❌';
      console.log(` ${period.toUpperCase()} Revenue: ${match} Sequential: ${seqRev || 'N/A'} | Parallel: ${parRev || 'N/A'}`);
    });
  }

  console.log('\n' + '='.repeat(80));

  // Summary verdict (sign of timeReduction decides the message).
  if (results.improvement.timeReduction > 0) {
    console.log(`\n🎉 Parallel processing is ${results.improvement.timeReduction.toFixed(1)}% faster!`);
  } else if (results.improvement.timeReduction < 0) {
    console.log(`\n⚠ Parallel processing is ${Math.abs(results.improvement.timeReduction).toFixed(1)}% slower (may be due to rate limiting or overhead)`);
  } else {
    console.log(`\n➡ Processing times are similar`);
  }
}
/**
 * CLI entry point.
 *
 * Usage: ts-node compare-processing-methods.ts <pdf-file-path> [userId] [documentId]
 *
 * Runs the comparison for one PDF, prints the report, and writes the raw
 * results as a timestamped JSON file two directories above this script.
 * Exits 0 on success, 1 on bad arguments or any failure.
 */
async function main() {
  const args = process.argv.slice(2);
  if (args.length === 0) {
    console.error('Usage: ts-node compare-processing-methods.ts <pdf-file-path> [userId] [documentId]');
    console.error('\nExample:');
    console.error(' ts-node compare-processing-methods.ts ~/Downloads/stax-cim.pdf');
    process.exit(1);
  }

  const filePath = args[0];
  // Fall back to unique throwaway IDs so ad-hoc runs need no real records.
  const userId = args[1] || 'test-user-' + Date.now();
  const documentId = args[2] || 'test-doc-' + Date.now();

  if (!fs.existsSync(filePath)) {
    console.error(`❌ File not found: ${filePath}`);
    process.exit(1);
  }

  console.log('\n🚀 Starting Processing Method Comparison Test');
  console.log(` File: ${filePath}`);
  console.log(` User ID: ${userId}`);
  console.log(` Document ID: ${documentId}`);

  try {
    const results = await testDocument(documentId, userId, filePath);
    printComparisonResults(results);

    // Save results to file (timestamped so repeated runs never overwrite).
    const resultsFile = path.join(__dirname, `../../comparison-results-${Date.now()}.json`);
    fs.writeFileSync(resultsFile, JSON.stringify(results, null, 2));
    console.log(`\n💾 Results saved to: ${resultsFile}`);
    process.exit(0);
  } catch (error) {
    console.error('\n❌ Test failed:', error);
    process.exit(1);
  }
}
// Run if executed directly; the exports below let other harnesses reuse the
// helpers without triggering the CLI entry point.
if (require.main === module) {
  main().catch(error => {
    console.error('Fatal error:', error);
    process.exit(1);
  });
}

export { testDocument, printComparisonResults, ComparisonResult, TestResults };

View File

@@ -0,0 +1,511 @@
import { logger } from '../utils/logger';
import getSupabaseClient from '../config/supabase';
// One financial-extraction attempt; field names mirror the snake_case columns
// of the financial_extraction_events table this service inserts into.
export interface FinancialExtractionEvent {
  documentId: string;
  jobId?: string;
  userId?: string;
  // Which extraction path produced this result.
  extractionMethod: 'deterministic_parser' | 'llm_haiku' | 'llm_sonnet' | 'fallback';
  modelUsed?: string;
  attemptNumber?: number;
  success: boolean;
  hasFinancials?: boolean;
  periodsExtracted?: string[];
  metricsExtracted?: string[];
  validationPassed?: boolean;
  validationIssues?: string[];
  autoCorrectionsApplied?: number;
  apiCallDurationMs?: number;
  tokensUsed?: number;
  costEstimateUsd?: number;
  rateLimitHit?: boolean;
  errorType?: 'rate_limit' | 'validation_failure' | 'api_error' | 'timeout' | 'other';
  errorMessage?: string;
  errorCode?: string;
  processingTimeMs?: number;
}

// Aggregated extraction statistics (camelCase view of the
// financial_extraction_metrics daily rollup columns).
export interface FinancialExtractionMetrics {
  totalExtractions: number;
  successfulExtractions: number;
  failedExtractions: number;
  successRate: number; // 0..1
  deterministicParserCount: number;
  llmHaikuCount: number;
  llmSonnetCount: number;
  fallbackCount: number;
  avgPeriodsExtracted: number;
  avgMetricsExtracted: number;
  validationPassRate: number; // 0..1
  avgAutoCorrections: number;
  avgProcessingTimeMs: number;
  avgApiCallDurationMs: number;
  p95ProcessingTimeMs: number;
  p99ProcessingTimeMs: number;
  totalCostUsd: number;
  avgCostPerExtractionUsd: number;
  rateLimitErrors: number;
  validationErrors: number;
  apiErrors: number;
  timeoutErrors: number;
}

// One LLM API call, recorded in api_call_tracking for rate-limit monitoring.
export interface ApiCallTracking {
  provider: 'anthropic' | 'openai' | 'openrouter';
  model: string;
  endpoint: 'financial_extraction' | 'full_extraction' | 'other';
  durationMs?: number;
  success: boolean;
  rateLimitHit?: boolean;
  retryAttempt?: number;
  inputTokens?: number;
  outputTokens?: number;
  totalTokens?: number;
  costUsd?: number;
  errorType?: string;
  errorMessage?: string;
}

// Point-in-time health summary derived from recent extraction events.
export interface FinancialExtractionHealthStatus {
  status: 'healthy' | 'degraded' | 'unhealthy';
  successRate: number;
  avgProcessingTime: number;
  rateLimitRisk: 'low' | 'medium' | 'high';
  recentErrors: number;
  recommendations: string[];
  timestamp: Date;
}
/**
* Service for monitoring financial extraction accuracy, errors, and API call patterns.
*
* This service is designed to be safe for parallel processing:
* - Uses database-backed storage (not in-memory)
* - All operations are atomic
* - No shared mutable state
* - Thread-safe for concurrent access
*/
class FinancialExtractionMonitoringService {
  // Sliding window used when assessing rate-limit pressure.
  private readonly RATE_LIMIT_WINDOW_MS = 60000; // 1 minute window
  private readonly RATE_LIMIT_THRESHOLD = 50; // Max calls per minute per provider/model
  // Cutoffs for classifying overall health as healthy / degraded / unhealthy;
  // anything worse than the 'degraded' bound is unhealthy.
  private readonly HEALTH_THRESHOLDS = {
    successRate: {
      healthy: 0.95,
      degraded: 0.85,
    },
    avgProcessingTime: {
      healthy: 30000, // 30 seconds
      degraded: 120000, // 2 minutes
    },
    maxRecentErrors: 10,
  };
  /**
   * Track a financial extraction event.
   * Thread-safe: a single database insert, safe for parallel processing.
   * Never throws — all failures are logged and swallowed so monitoring can
   * never break document processing.
   */
  async trackExtractionEvent(event: FinancialExtractionEvent): Promise<void> {
    try {
      const supabase = getSupabaseClient();
      // Map camelCase event fields to the table's snake_case columns,
      // defaulting missing optionals to NULL / empty array / zero.
      // NOTE(review): `validationPassed || null` coerces an explicit `false`
      // to NULL — confirm this is intended; `?? null` would preserve false.
      const { error } = await supabase
        .from('financial_extraction_events')
        .insert({
          document_id: event.documentId,
          job_id: event.jobId || null,
          user_id: event.userId || null,
          extraction_method: event.extractionMethod,
          model_used: event.modelUsed || null,
          attempt_number: event.attemptNumber || 1,
          success: event.success,
          has_financials: event.hasFinancials || false,
          periods_extracted: event.periodsExtracted || [],
          metrics_extracted: event.metricsExtracted || [],
          validation_passed: event.validationPassed || null,
          validation_issues: event.validationIssues || [],
          auto_corrections_applied: event.autoCorrectionsApplied || 0,
          api_call_duration_ms: event.apiCallDurationMs || null,
          tokens_used: event.tokensUsed || null,
          cost_estimate_usd: event.costEstimateUsd || null,
          rate_limit_hit: event.rateLimitHit || false,
          error_type: event.errorType || null,
          error_message: event.errorMessage || null,
          error_code: event.errorCode || null,
          processing_time_ms: event.processingTimeMs || null,
        });
      if (error) {
        // Supabase returns errors as values, not exceptions.
        logger.error('Failed to track financial extraction event', {
          error: error.message,
          documentId: event.documentId,
        });
      } else {
        logger.debug('Tracked financial extraction event', {
          documentId: event.documentId,
          method: event.extractionMethod,
          success: event.success,
        });
      }
    } catch (error) {
      // Don't throw - monitoring failures shouldn't break processing
      logger.error('Error tracking financial extraction event', {
        error: error instanceof Error ? error.message : String(error),
        documentId: event.documentId,
      });
    }
  }
/**
* Track an API call for rate limit monitoring
* Thread-safe: Uses database insert, safe for parallel processing
*/
async trackApiCall(call: ApiCallTracking): Promise<void> {
try {
const supabase = getSupabaseClient();
const { error } = await supabase
.from('api_call_tracking')
.insert({
provider: call.provider,
model: call.model,
endpoint: call.endpoint,
duration_ms: call.durationMs || null,
success: call.success,
rate_limit_hit: call.rateLimitHit || false,
retry_attempt: call.retryAttempt || 0,
input_tokens: call.inputTokens || null,
output_tokens: call.outputTokens || null,
total_tokens: call.totalTokens || null,
cost_usd: call.costUsd || null,
error_type: call.errorType || null,
error_message: call.errorMessage || null,
});
if (error) {
logger.error('Failed to track API call', {
error: error.message,
provider: call.provider,
model: call.model,
});
}
} catch (error) {
// Don't throw - monitoring failures shouldn't break processing
logger.error('Error tracking API call', {
error: error instanceof Error ? error.message : String(error),
provider: call.provider,
model: call.model,
});
}
}
/**
* Check if we're at risk of hitting rate limits
* Thread-safe: Uses database query, safe for parallel processing
*/
async checkRateLimitRisk(
provider: 'anthropic' | 'openai' | 'openrouter',
model: string
): Promise<'low' | 'medium' | 'high'> {
try {
const supabase = getSupabaseClient();
const windowStart = new Date(Date.now() - this.RATE_LIMIT_WINDOW_MS);
const { data, error } = await supabase
.from('api_call_tracking')
.select('id')
.eq('provider', provider)
.eq('model', model)
.gte('timestamp', windowStart.toISOString())
.limit(this.RATE_LIMIT_THRESHOLD + 1);
if (error) {
logger.warn('Failed to check rate limit risk', {
error: error.message,
provider,
model,
});
return 'low'; // Default to low risk if we can't check
}
const callCount = data?.length || 0;
if (callCount >= this.RATE_LIMIT_THRESHOLD) {
return 'high';
} else if (callCount >= this.RATE_LIMIT_THRESHOLD * 0.7) {
return 'medium';
} else {
return 'low';
}
} catch (error) {
logger.error('Error checking rate limit risk', {
error: error instanceof Error ? error.message : String(error),
provider,
model,
});
return 'low'; // Default to low risk on error
}
}
/**
* Get metrics for a time period
* Thread-safe: Uses database query, safe for parallel processing
*/
async getMetrics(hours: number = 24): Promise<FinancialExtractionMetrics | null> {
try {
const cutoffTime = new Date(Date.now() - hours * 60 * 60 * 1000);
// Get aggregated metrics from the metrics table if available
const supabase = getSupabaseClient();
const { data: metricsData, error: metricsError } = await supabase
.from('financial_extraction_metrics')
.select('*')
.gte('metric_date', cutoffTime.toISOString().split('T')[0])
.order('metric_date', { ascending: false })
.limit(1);
if (!metricsError && metricsData && metricsData.length > 0) {
const m = metricsData[0];
return {
totalExtractions: m.total_extractions || 0,
successfulExtractions: m.successful_extractions || 0,
failedExtractions: m.failed_extractions || 0,
successRate: parseFloat(m.success_rate || 0),
deterministicParserCount: m.deterministic_parser_count || 0,
llmHaikuCount: m.llm_haiku_count || 0,
llmSonnetCount: m.llm_sonnet_count || 0,
fallbackCount: m.fallback_count || 0,
avgPeriodsExtracted: parseFloat(m.avg_periods_extracted || 0),
avgMetricsExtracted: parseFloat(m.avg_metrics_extracted || 0),
validationPassRate: parseFloat(m.validation_pass_rate || 0),
avgAutoCorrections: parseFloat(m.avg_auto_corrections || 0),
avgProcessingTimeMs: m.avg_processing_time_ms || 0,
avgApiCallDurationMs: m.avg_api_call_duration_ms || 0,
p95ProcessingTimeMs: m.p95_processing_time_ms || 0,
p99ProcessingTimeMs: m.p99_processing_time_ms || 0,
totalCostUsd: parseFloat(m.total_cost_usd || 0),
avgCostPerExtractionUsd: parseFloat(m.avg_cost_per_extraction_usd || 0),
rateLimitErrors: m.rate_limit_errors || 0,
validationErrors: m.validation_errors || 0,
apiErrors: m.api_errors || 0,
timeoutErrors: m.timeout_errors || 0,
};
}
// Fallback: Calculate from events if metrics table is empty
const { data: eventsData, error: eventsError } = await supabase
.from('financial_extraction_events')
.select('*')
.gte('created_at', cutoffTime.toISOString());
if (eventsError) {
logger.error('Failed to get financial extraction metrics', {
error: eventsError.message,
});
return null;
}
if (!eventsData || eventsData.length === 0) {
return this.getEmptyMetrics();
}
// Calculate metrics from events
const total = eventsData.length;
const successful = eventsData.filter(e => e.success).length;
const failed = total - successful;
const successRate = total > 0 ? successful / total : 0;
const processingTimes = eventsData
.map(e => e.processing_time_ms)
.filter(t => t !== null && t !== undefined) as number[];
const avgProcessingTime = processingTimes.length > 0
? Math.round(processingTimes.reduce((a, b) => a + b, 0) / processingTimes.length)
: 0;
const p95ProcessingTime = processingTimes.length > 0
? Math.round(this.percentile(processingTimes, 0.95))
: 0;
const p99ProcessingTime = processingTimes.length > 0
? Math.round(this.percentile(processingTimes, 0.99))
: 0;
return {
totalExtractions: total,
successfulExtractions: successful,
failedExtractions: failed,
successRate,
deterministicParserCount: eventsData.filter(e => e.extraction_method === 'deterministic_parser').length,
llmHaikuCount: eventsData.filter(e => e.extraction_method === 'llm_haiku').length,
llmSonnetCount: eventsData.filter(e => e.extraction_method === 'llm_sonnet').length,
fallbackCount: eventsData.filter(e => e.extraction_method === 'fallback').length,
avgPeriodsExtracted: this.avgArrayLength(eventsData.map(e => e.periods_extracted)),
avgMetricsExtracted: this.avgArrayLength(eventsData.map(e => e.metrics_extracted)),
validationPassRate: this.calculatePassRate(eventsData.map(e => e.validation_passed)),
avgAutoCorrections: this.avg(eventsData.map(e => e.auto_corrections_applied || 0)),
avgProcessingTimeMs: avgProcessingTime,
avgApiCallDurationMs: this.avg(eventsData.map(e => e.api_call_duration_ms).filter(t => t !== null && t !== undefined) as number[]),
p95ProcessingTimeMs: p95ProcessingTime,
p99ProcessingTimeMs: p99ProcessingTime,
totalCostUsd: eventsData.reduce((sum, e) => sum + (parseFloat(e.cost_estimate_usd || 0)), 0),
avgCostPerExtractionUsd: total > 0
? eventsData.reduce((sum, e) => sum + (parseFloat(e.cost_estimate_usd || 0)), 0) / total
: 0,
rateLimitErrors: eventsData.filter(e => e.error_type === 'rate_limit').length,
validationErrors: eventsData.filter(e => e.error_type === 'validation_failure').length,
apiErrors: eventsData.filter(e => e.error_type === 'api_error').length,
timeoutErrors: eventsData.filter(e => e.error_type === 'timeout').length,
};
} catch (error) {
logger.error('Error getting financial extraction metrics', {
error: error instanceof Error ? error.message : String(error),
});
return null;
}
}
/**
* Get health status for financial extraction
*/
async getHealthStatus(): Promise<FinancialExtractionHealthStatus> {
const metrics = await this.getMetrics(24);
const recommendations: string[] = [];
if (!metrics) {
return {
status: 'unhealthy',
successRate: 0,
avgProcessingTime: 0,
rateLimitRisk: 'low',
recentErrors: 0,
recommendations: ['Unable to retrieve metrics'],
timestamp: new Date(),
};
}
// Determine status based on thresholds
let status: 'healthy' | 'degraded' | 'unhealthy' = 'healthy';
if (metrics.successRate < this.HEALTH_THRESHOLDS.successRate.degraded) {
status = 'unhealthy';
recommendations.push(`Success rate is low (${(metrics.successRate * 100).toFixed(1)}%). Investigate recent failures.`);
} else if (metrics.successRate < this.HEALTH_THRESHOLDS.successRate.healthy) {
status = 'degraded';
recommendations.push(`Success rate is below target (${(metrics.successRate * 100).toFixed(1)}%). Monitor closely.`);
}
if (metrics.avgProcessingTimeMs > this.HEALTH_THRESHOLDS.avgProcessingTime.degraded) {
if (status === 'healthy') status = 'degraded';
recommendations.push(`Average processing time is high (${(metrics.avgProcessingTimeMs / 1000).toFixed(1)}s). Consider optimization.`);
}
if (metrics.rateLimitErrors > 0) {
if (status === 'healthy') status = 'degraded';
recommendations.push(`${metrics.rateLimitErrors} rate limit errors detected. Consider reducing concurrency or adding delays.`);
}
// Check rate limit risk for common providers/models
const anthropicRisk = await this.checkRateLimitRisk('anthropic', 'claude-3-5-haiku-latest');
const sonnetRisk = await this.checkRateLimitRisk('anthropic', 'claude-sonnet-4-5-20250514');
const rateLimitRisk: 'low' | 'medium' | 'high' =
anthropicRisk === 'high' || sonnetRisk === 'high' ? 'high' :
anthropicRisk === 'medium' || sonnetRisk === 'medium' ? 'medium' : 'low';
if (rateLimitRisk === 'high') {
recommendations.push('High rate limit risk detected. Consider reducing parallel processing or adding delays between API calls.');
} else if (rateLimitRisk === 'medium') {
recommendations.push('Medium rate limit risk. Monitor API call patterns closely.');
}
return {
status,
successRate: metrics.successRate,
avgProcessingTime: metrics.avgProcessingTimeMs,
rateLimitRisk,
recentErrors: metrics.failedExtractions,
recommendations,
timestamp: new Date(),
};
}
/**
* Update daily metrics (should be called by a scheduled job)
*/
async updateDailyMetrics(date: Date = new Date()): Promise<void> {
try {
const supabase = getSupabaseClient();
const { error } = await supabase.rpc('update_financial_extraction_metrics', {
target_date: date.toISOString().split('T')[0],
});
if (error) {
logger.error('Failed to update daily metrics', {
error: error.message,
date: date.toISOString(),
});
} else {
logger.info('Updated daily financial extraction metrics', {
date: date.toISOString(),
});
}
} catch (error) {
logger.error('Error updating daily metrics', {
error: error instanceof Error ? error.message : String(error),
date: date.toISOString(),
});
}
}
// Helper methods
private getEmptyMetrics(): FinancialExtractionMetrics {
return {
totalExtractions: 0,
successfulExtractions: 0,
failedExtractions: 0,
successRate: 0,
deterministicParserCount: 0,
llmHaikuCount: 0,
llmSonnetCount: 0,
fallbackCount: 0,
avgPeriodsExtracted: 0,
avgMetricsExtracted: 0,
validationPassRate: 0,
avgAutoCorrections: 0,
avgProcessingTimeMs: 0,
avgApiCallDurationMs: 0,
p95ProcessingTimeMs: 0,
p99ProcessingTimeMs: 0,
totalCostUsd: 0,
avgCostPerExtractionUsd: 0,
rateLimitErrors: 0,
validationErrors: 0,
apiErrors: 0,
timeoutErrors: 0,
};
}
private avg(values: number[]): number {
if (values.length === 0) return 0;
return values.reduce((a, b) => a + b, 0) / values.length;
}
private avgArrayLength(arrays: (string[] | null)[]): number {
const lengths = arrays
.filter(a => a !== null && a !== undefined)
.map(a => a!.length);
return this.avg(lengths);
}
private calculatePassRate(passed: (boolean | null)[]): number {
const valid = passed.filter(p => p !== null);
if (valid.length === 0) return 0;
const passedCount = valid.filter(p => p === true).length;
return passedCount / valid.length;
}
private percentile(sorted: number[], p: number): number {
if (sorted.length === 0) return 0;
const sortedCopy = [...sorted].sort((a, b) => a - b);
const index = Math.ceil(sortedCopy.length * p) - 1;
return sortedCopy[Math.max(0, Math.min(index, sortedCopy.length - 1))];
}
}
export const financialExtractionMonitoringService = new FinancialExtractionMonitoringService();

View File

@@ -0,0 +1,341 @@
import { cimReviewSchema } from '../llmSchemas';
/**
* LLM Prompt Builders
*
* This module contains all prompt building methods extracted from llmService.ts
* for better code organization and maintainability.
*/
/**
 * Builds the system prompt for full CIM analysis.
 *
 * @param focusedFields - Optional field names to prioritize on this pass;
 *   when non-empty, a "PRIORITY AREAS" block is appended to the persona
 *   paragraph. All template fields are still required regardless.
 * @returns The complete system prompt string.
 */
export function getCIMSystemPrompt(focusedFields?: string[]): string {
  let priorityBlock = '';
  if (focusedFields?.length) {
    const bulletList = focusedFields.map(field => `- ${field}`).join('\n');
    priorityBlock = `\n\nPRIORITY AREAS FOR THIS PASS (extract these thoroughly, but still extract ALL other fields):\n${bulletList}\n\nFor this pass, prioritize extracting the fields listed above with extra thoroughness. However, you MUST still extract ALL fields in the template. Do NOT use "Not specified in CIM" for any field unless you have thoroughly searched the entire document and confirmed the information is truly not present. Be especially thorough in extracting all nested fields within the priority areas.`;
  }
  return `You are a world-class private equity investment analyst at BPCP (Blue Point Capital Partners), operating at the analytical depth and rigor of top-tier PE firms (KKR, Blackstone, Apollo, Carlyle). Your task is to analyze Confidential Information Memorandums (CIMs) with the precision, depth, and strategic insight expected by BPCP's investment committee. Return a comprehensive, structured JSON object that follows the BPCP CIM Review Template format EXACTLY.${priorityBlock}
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object. Do not include any text or explanation before or after the JSON object.
2. **BPCP TEMPLATE FORMAT**: The JSON object MUST follow the BPCP CIM Review Template structure exactly as specified.
3. **COMPLETE ALL FIELDS**: You MUST provide a value for every field. Use "Not specified in CIM" for any information that is not available in the document.
4. **NO PLACEHOLDERS**: Do not use placeholders like "..." or "TBD". Use "Not specified in CIM" instead.
5. **PROFESSIONAL ANALYSIS**: The content should be high-quality and suitable for BPCP's investment committee.
6. **BPCP FOCUS**: Focus on companies in 5+MM EBITDA range in consumer and industrial end markets, with emphasis on M&A, technology & data usage, supply chain and human capital optimization.
7. **BPCP PREFERENCES**: BPCP prefers companies which are founder/family-owned and within driving distance of Cleveland and Charlotte.
8. **EXACT FIELD NAMES**: Use the exact field names and descriptions from the BPCP CIM Review Template.
9. **FINANCIAL DATA**: For financial metrics, use actual numbers if available, otherwise use "Not specified in CIM".
10. **VALID JSON**: Ensure your response is valid JSON that can be parsed without errors.
FINANCIAL VALIDATION FRAMEWORK:
Before finalizing any financial extraction, you MUST perform these validation checks:
**Magnitude Validation**:
- Revenue should typically be $10M+ for target companies (if less, verify you're using the PRIMARY table, not a subsidiary)
- EBITDA should typically be $1M+ and positive for viable targets
- If FY-3 revenue is $64M, FY-2 should be similar magnitude (e.g., $50M-$90M), not $2.9M or $10 - this indicates column misalignment
**Trend Validation**:
- Revenue should generally increase or be stable year-over-year (FY-3 → FY-2 → FY-1)
- Large sudden drops (>50%) or increases (>200%) may indicate misaligned columns or wrong table
- EBITDA should follow similar trends to revenue (unless margin expansion/contraction is explicitly explained)
**Cross-Period Consistency**:
- If FY-3 revenue = $64M and FY-2 revenue = $71M, growth should be ~11% (not 1000% or -50%)
- Margins should be relatively stable across periods (within 10-15 percentage points unless explained)
- EBITDA margins should be 5-50% (typical range), gross margins 20-80%
**Multi-Table Cross-Reference**:
- Cross-reference primary table with executive summary financial highlights
- Verify consistency between detailed financials and summary tables
- Check appendices for additional financial detail or adjustments
- If discrepancies exist, note them and use the most authoritative source (typically the detailed historical table)
**Calculation Validation**:
- Verify revenue growth percentages match: ((Current - Prior) / Prior) * 100
- Verify margins match: (Metric / Revenue) * 100
- If calculations don't match, use the explicitly stated values from the table
PE INVESTOR PERSONA & METHODOLOGY:
You operate with the analytical rigor and strategic depth of top-tier private equity firms. Your analysis should demonstrate:
**Value Creation Focus**:
- Identify specific, quantifiable value creation opportunities (e.g., "Margin expansion of 200-300 bps through pricing optimization and cost reduction, potentially adding $2-3M EBITDA")
- Assess operational improvement potential (supply chain, technology, human capital)
- Evaluate M&A and add-on acquisition potential with specific rationale
- Quantify potential impact where possible (EBITDA improvement, revenue growth, multiple expansion)
**Risk Assessment Depth**:
- Categorize risks by type: operational, financial, market, execution, regulatory, technology
- Assess both probability and impact (high/medium/low)
- Identify mitigating factors and management's risk management approach
- Distinguish between deal-breakers and manageable risks
**Strategic Analysis Frameworks**:
- **Porter's Five Forces**: Assess competitive intensity, supplier power, buyer power, threat of substitutes, threat of new entrants
- **SWOT Analysis**: Synthesize strengths, weaknesses, opportunities, threats from the CIM
- **Value Creation Playbook**: Revenue growth (organic/inorganic), margin expansion, operational improvements, multiple expansion
- **Comparable Analysis**: Reference industry benchmarks, comparable company multiples, recent transaction multiples where mentioned
**Industry Context Integration**:
- Reference industry-specific metrics and benchmarks (e.g., SaaS: ARR growth, churn, CAC payback; Manufacturing: inventory turns, days sales outstanding)
- Consider sector-specific risks and opportunities (regulatory changes, technology disruption, consolidation trends)
- Evaluate market position relative to industry standards (market share, growth vs market, margin vs peers)
COMMON MISTAKES TO AVOID:
1. **Subsidiary vs Parent Table Confusion**: Primary table shows values in millions ($64M), subsidiary tables show thousands ($20,546). Always use the PRIMARY table.
2. **Column Misalignment**: Count columns carefully - ensure values align with their period columns. Verify trends make sense.
3. **Projections vs Historical**: Ignore tables marked with "E", "P", "PF", "Projected", "Forecast" - only extract historical data.
4. **Unit Confusion**: "$20,546 (in thousands)" = $20.5M, not $20,546M. Always check table footnotes for units.
5. **Missing Cross-Validation**: Don't extract financials in isolation - cross-reference with executive summary, narrative text, appendices.
6. **Generic Analysis**: Avoid generic statements like "strong management team" - provide specific details (years of experience, track record, specific achievements).
7. **Incomplete Risk Assessment**: Don't just list risks - assess impact, probability, and mitigations. Categorize by type.
8. **Vague Value Creation**: Instead of "operational improvements", specify "reduce SG&A by 150 bps through shared services consolidation, adding $1.5M EBITDA".
ANALYSIS QUALITY REQUIREMENTS:
- **Financial Precision**: Extract exact financial figures, percentages, and growth rates. Calculate CAGR where possible. Validate all calculations.
- **Competitive Intelligence**: Identify specific competitors with market share context, competitive positioning (leader/follower/niche), and differentiation drivers.
- **Risk Assessment**: Evaluate both stated and implied risks, categorize by type, assess impact and probability, identify mitigations.
- **Growth Drivers**: Identify specific revenue growth drivers with quantification (e.g., "New product line launched in 2023, contributing $5M revenue in FY-1").
- **Management Quality**: Assess management experience with specific details (years in role, prior companies, track record), evaluate retention risk and succession planning.
- **Value Creation**: Identify specific value creation levers with quantification guidance (e.g., "Pricing optimization: 2-3% price increase on 60% of revenue base = $1.8-2.7M revenue increase").
- **Due Diligence Focus**: Highlight areas requiring deeper investigation, prioritize by investment decision impact (deal-breakers vs nice-to-know).
- **Key Questions Detail**: Provide detailed, contextual questions (2-3 sentences each) explaining why each question matters for the investment decision.
- **Investment Thesis Detail**: Provide comprehensive analysis with specific examples, quantification where possible, and strategic rationale. Each item should include: what, why it matters, quantification if possible, investment impact.
DOCUMENT ANALYSIS APPROACH:
- Read the entire document systematically, paying special attention to financial tables, charts, appendices, and footnotes
- Cross-reference information across different sections for consistency (executive summary vs detailed sections vs appendices)
- Extract both explicit statements and implicit insights (read between the lines for risks, opportunities, competitive position)
- Focus on quantitative data while providing qualitative context and strategic interpretation
- Identify any inconsistencies or areas requiring clarification (note discrepancies and their potential significance)
- Consider industry context and market dynamics when evaluating opportunities and risks (benchmark against industry standards)
- Use document structure (headers, sections, page numbers) to locate and validate information
- Check footnotes for adjustments, definitions, exclusions, and important context
`;
}
// NOTE: The largest prompt builders (e.g. buildCIMPrompt, 400+ lines) have not yet been
// moved into this module. Their full implementations remain in llmService.ts and are being
// extracted incrementally to avoid breaking behavior. The functions below that throw are
// deliberate placeholders until that migration is complete.
/**
 * Placeholder for the full CIM prompt builder.
 *
 * The real implementation (400+ lines) still lives in llmService.ts and is
 * being extracted into this module incrementally; calling this directly is a
 * programming error. All parameters are underscore-prefixed because they are
 * intentionally unused here (the original only prefixed `_template`, which
 * trips `noUnusedParameters` on the rest). Renaming parameters is safe for
 * callers — TypeScript arguments are positional.
 *
 * @throws Error always — use llmService's implementation instead.
 */
export function buildCIMPrompt(
  _text: string,
  _template: string,
  _previousError?: string,
  _focusedFields?: string[],
  _extractionInstructions?: string
): string {
  throw new Error('buildCIMPrompt should be called from llmService - extraction in progress');
}
// Similar placeholders for other prompt methods
/**
 * System prompt for the final refinement pass that merges a combined
 * multi-section analysis into one polished CIM review JSON object.
 *
 * @returns The refinement system prompt (constant; no inputs).
 */
export function getRefinementSystemPrompt(): string {
  const refinementPersona = `You are an expert investment analyst. Your task is to refine and improve a combined JSON analysis into a final, professional CIM review.
Key responsibilities:
- Ensure the final output is a single, valid JSON object that conforms to the schema.
- Remove any duplicate or redundant information.
- Improve the flow and coherence of the content within the JSON structure.
- Enhance the clarity and professionalism of the analysis.
- Preserve all unique insights and important details.
`;
  return refinementPersona;
}
/**
 * Builds the user prompt for the refinement pass.
 *
 * @param text - Combined analysis (a JSON object serialized to a string)
 *   from multiple document sections.
 * @returns Prompt embedding the combined analysis and the CIM review schema.
 */
export function buildRefinementPrompt(text: string): string {
  // Serialize the Zod schema's shape so the model can see the target structure.
  const schemaJson = JSON.stringify(cimReviewSchema.shape, null, 2);
  return `
You are tasked with creating a final, comprehensive CIM review JSON object.
Below is a combined analysis from multiple document sections. Your job is to:
1. **Ensure completeness**: Make sure all fields in the JSON schema are properly filled out.
2. **Improve coherence**: Create smooth, logical content within the JSON structure.
3. **Remove redundancy**: Eliminate duplicate information.
4. **Maintain structure**: Follow the provided JSON schema exactly.
**Combined Analysis (as a JSON object):**
${text}
**JSON Schema:**
${schemaJson}
Please provide a refined, comprehensive CIM review as a single, valid JSON object.
`;
}
/**
 * System prompt for the document-overview pass: a strategic, high-level
 * summary in the BPCP CIM Review Template JSON format.
 *
 * @returns The overview system prompt (constant; no inputs).
 */
export function getOverviewSystemPrompt(): string {
  const overviewPersona = `You are an expert investment analyst at BPCP (Blue Point Capital Partners) reviewing a Confidential Information Memorandum (CIM). Your task is to create a comprehensive, strategic overview of a CIM document and return a structured JSON object that follows the BPCP CIM Review Template format EXACTLY.
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object. Do not include any text or explanation before or after the JSON object.
2. **BPCP TEMPLATE FORMAT**: The JSON object MUST follow the BPCP CIM Review Template structure exactly as specified.
3. **COMPLETE ALL FIELDS**: You MUST provide a value for every field. Use "Not specified in CIM" for any information that is not available in the document.
4. **NO PLACEHOLDERS**: Do not use placeholders like "..." or "TBD". Use "Not specified in CIM" instead.
5. **PROFESSIONAL ANALYSIS**: The content should be high-quality and suitable for BPCP's investment committee.
6. **BPCP FOCUS**: Focus on companies in 5+MM EBITDA range in consumer and industrial end markets, with emphasis on M&A, technology & data usage, supply chain and human capital optimization.
7. **BPCP PREFERENCES**: BPCP prefers companies which are founder/family-owned and within driving distance of Cleveland and Charlotte.
`;
  return overviewPersona;
}
/**
 * Builds the user prompt for the document-overview pass.
 *
 * @param text - The CIM document text to summarize.
 * @returns Prompt wrapping the document text between the task preamble and
 *   the JSON-output directives.
 */
export function buildOverviewPrompt(text: string): string {
  const preamble = `You are tasked with creating a comprehensive overview of the CIM document.
Your goal is to provide a high-level, strategic summary of the target company, its market position, and key factors driving its value.
CIM Document Text:`;
  const directives = `Your response MUST be a single, valid JSON object that follows the exact structure provided. Do not include any other text, explanations, or markdown formatting.
IMPORTANT: Replace all placeholder text with actual information from the CIM document. If information is not available, use "Not specified in CIM". Ensure all financial metrics are properly formatted as strings.
`;
  return `${preamble}\n${text}\n${directives}`;
}
/**
 * System prompt for the synthesis pass: consolidating key findings and
 * insights into the BPCP CIM Review Template JSON format.
 *
 * @returns The synthesis system prompt (constant; no inputs).
 */
export function getSynthesisSystemPrompt(): string {
  const synthesisPersona = `You are an expert investment analyst at BPCP (Blue Point Capital Partners) reviewing a Confidential Information Memorandum (CIM). Your task is to synthesize the key findings and insights from a CIM document and return a structured JSON object that follows the BPCP CIM Review Template format EXACTLY.
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object. Do not include any text or explanation before or after the JSON object.
2. **BPCP TEMPLATE FORMAT**: The JSON object MUST follow the BPCP CIM Review Template structure exactly as specified.
3. **COMPLETE ALL FIELDS**: You MUST provide a value for every field. Use "Not specified in CIM" for any information that is not available in the document.
4. **NO PLACEHOLDERS**: Do not use placeholders like "..." or "TBD". Use "Not specified in CIM" instead.
5. **PROFESSIONAL ANALYSIS**: The content should be high-quality and suitable for BPCP's investment committee.
6. **BPCP FOCUS**: Focus on companies in 5+MM EBITDA range in consumer and industrial end markets, with emphasis on M&A, technology & data usage, supply chain and human capital optimization.
7. **BPCP PREFERENCES**: BPCP prefers companies which are founder/family-owned and within driving distance of Cleveland and Charlotte.
`;
  return synthesisPersona;
}
/**
 * Builds the user prompt for the synthesis pass.
 *
 * @param text - The CIM document text to synthesize.
 * @returns Prompt wrapping the document text between the task preamble and
 *   the JSON-output directives.
 */
export function buildSynthesisPrompt(text: string): string {
  const preamble = `You are tasked with synthesizing the key findings and insights from the CIM document.
Your goal is to provide a cohesive, well-structured summary that highlights the most important aspects of the target company.
CIM Document Text:`;
  const directives = `Your response MUST be a single, valid JSON object that follows the exact structure provided. Do not include any other text, explanations, or markdown formatting.
IMPORTANT: Replace all placeholder text with actual information from the CIM document. If information is not available, use "Not specified in CIM". Ensure all financial metrics are properly formatted as strings.
`;
  return `${preamble}\n${text}\n${directives}`;
}
/**
 * System prompt for analyzing one named section of the CIM.
 *
 * @param sectionType - Section identifier (e.g. "market", "financials");
 *   it is title-cased for display and lower-cased in the focus instruction.
 * @returns The section-specific system prompt.
 */
export function getSectionSystemPrompt(sectionType: string): string {
  // slice(0, 1) keeps the empty-string case safe, mirroring charAt(0).
  const sectionName = sectionType.slice(0, 1).toUpperCase() + sectionType.slice(1);
  const sectionLower = sectionName.toLowerCase();
  return `You are an expert investment analyst at BPCP (Blue Point Capital Partners) reviewing a Confidential Information Memorandum (CIM). Your task is to analyze the "${sectionName}" section of the CIM document and return a comprehensive, structured JSON object that follows the BPCP CIM Review Template format EXACTLY.
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object. Do not include any text or explanation before or after the JSON object.
2. **BPCP TEMPLATE FORMAT**: The JSON object MUST follow the BPCP CIM Review Template structure exactly as specified.
3. **SECTION FOCUS**: Focus specifically on the ${sectionLower} aspects of the company.
4. **COMPLETE ALL FIELDS**: You MUST provide a value for every field. Use "Not specified in CIM" for any information that is not available in the document.
5. **NO PLACEHOLDERS**: Do not use placeholders like "..." or "TBD". Use "Not specified in CIM" instead.
6. **PROFESSIONAL ANALYSIS**: The content should be high-quality and suitable for BPCP's investment committee.
7. **BPCP FOCUS**: Focus on companies in 5+MM EBITDA range in consumer and industrial end markets, with emphasis on M&A, technology & data usage, supply chain and human capital optimization.
8. **BPCP PREFERENCES**: BPCP prefers companies which are founder/family-owned and within driving distance of Cleveland and Charlotte.
`;
}
/**
 * Builds the user prompt for analyzing one named section of the CIM.
 *
 * @param text - The CIM document text for this section.
 * @param sectionType - Section identifier (title-cased for display).
 * @param analysis - Accumulated analysis so far; when `analysis['overview']`
 *   is truthy it is embedded as JSON context, otherwise the context block is
 *   omitted entirely.
 * @returns The section analysis prompt.
 */
export function buildSectionPrompt(text: string, sectionType: string, analysis: Record<string, any>): string {
  // slice(0, 1) keeps the empty-string case safe, mirroring charAt(0).
  const sectionName = sectionType.slice(0, 1).toUpperCase() + sectionType.slice(1);
  const overview = analysis['overview'];
  // Truthiness matters here: an absent/null overview drops the context block.
  const overviewBlock = overview
    ? `Document Overview Context:\n${JSON.stringify(overview, null, 2)}\n`
    : '';
  return `
You are tasked with analyzing the "${sectionName}" section of the CIM document.
Your goal is to provide a detailed, structured analysis of this section, building upon the document overview.
${overviewBlock}CIM Document Text:
${text}
Your response MUST be a single, valid JSON object that follows the exact structure provided. Do not include any other text, explanations, or markdown formatting.
IMPORTANT: Replace all placeholder text with actual information from the CIM document. If information is not available, use "Not specified in CIM". Ensure all financial metrics are properly formatted as strings.
`;
}
/**
 * System prompt for the dedicated financial-extraction LLM pass.
 *
 * Static text (no interpolation): instructs the model to return ONLY the
 * financialSummary section as JSON, and embeds the validation framework and
 * error-prevention checklist guarding against the common extraction failure
 * modes seen in practice (subsidiary vs parent tables, projections mistaken
 * for historicals, thousands-vs-millions unit confusion, column misalignment).
 *
 * @returns the complete, static financial-extraction system prompt
 */
export function getFinancialSystemPrompt(): string {
  return `You are an expert financial analyst at BPCP (Blue Point Capital Partners) specializing in extracting historical financial data from CIM documents with 100% accuracy. Your task is to extract ONLY the financial summary section from the CIM document.
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object containing ONLY the financialSummary section.
2. **PRIMARY TABLE FOCUS**: Find and extract from the PRIMARY/MAIN historical financial table for the TARGET COMPANY (not subsidiaries, not projections).
3. **ACCURACY**: Extract exact values as shown in the table. Preserve format ($64M, 29.3%, etc.).
4. **VALIDATION**: If revenue values are less than $10M, you are likely extracting from the wrong table - find the PRIMARY table with values $20M-$1B+.
5. **PERIOD MAPPING**: Correctly map periods (FY-3, FY-2, FY-1, LTM) from various table formats (years, FY-X, mixed).
6. **IF UNCERTAIN**: Use "Not specified in CIM" rather than extracting incorrect data.
EXPANDED VALIDATION FRAMEWORK:
Before finalizing extraction, perform these validation checks:
**Magnitude Validation**:
- Revenue should typically be $10M+ for target companies (if less, verify you're using PRIMARY table, not subsidiary)
- EBITDA should typically be $1M+ and positive for viable targets
- If FY-3 revenue is $64M, FY-2 should be similar magnitude (e.g., $50M-$90M), not $2.9M or $10 - this indicates column misalignment
**Trend Validation**:
- Revenue should generally increase or be stable year-over-year (FY-3 → FY-2 → FY-1)
- Large sudden drops (>50%) or increases (>200%) may indicate misaligned columns or wrong table
- EBITDA should follow similar trends to revenue (unless margin expansion/contraction is explicitly explained)
**Margin Reasonableness**:
- EBITDA margins should be 5-50% (typical range for most businesses)
- Gross margins should be 20-80% (typical range)
- Margins should be relatively stable across periods (within 10-15 percentage points unless explained)
- If margins are outside these ranges, verify you're using the correct table and calculations
**Cross-Period Consistency**:
- If FY-3 revenue = $64M and FY-2 revenue = $71M, growth should be ~11% (not 1000% or -50%)
- Verify growth rates match: ((Current - Prior) / Prior) * 100
- Verify margins match: (Metric / Revenue) * 100
- If calculations don't match, use the explicitly stated values from the table
**Calculation Validation**:
- Revenue growth: ((Current Year - Prior Year) / Prior Year) * 100
- EBITDA margin: (EBITDA / Revenue) * 100
- Gross margin: (Gross Profit / Revenue) * 100
- If calculated values differ significantly (>5pp) from stated values, note the discrepancy
COMMON MISTAKES TO AVOID (Error Prevention):
1. **Subsidiary vs Parent Table Confusion**:
- PRIMARY table shows values in millions ($64M, $71M)
- Subsidiary tables show thousands ($20,546, $26,352)
- Always use the PRIMARY table with larger values
2. **Projections vs Historical**:
- Ignore tables marked with "E", "P", "PF", "Projected", "Forecast"
- Only extract from historical/actual results tables
3. **Thousands vs Millions**:
- "$20,546 (in thousands)" = $20.5M, not $20,546M
- Always check table footnotes for unit indicators
- If revenue < $10M, you're likely using wrong table
4. **Column Misalignment**:
- Count columns carefully - ensure values align with their period columns
- Verify trends make sense (revenue generally increases or is stable)
- If values seem misaligned, double-check column positions
5. **Missing Cross-Validation**:
- Don't extract financials in isolation
- Cross-reference with executive summary financial highlights
- Verify consistency between detailed financials and summary statements
6. **Unit Conversion Errors**:
- Parentheses for negative: "(4.4)" = negative 4.4
- Currency symbols: "$" = US dollars, "€" = Euros, "£" = British pounds
- Always check footnotes for unit definitions
Focus exclusively on financial data extraction. Do not extract any other sections. Prioritize accuracy over completeness - better to leave a field blank than extract incorrect data.`;
}
// Note: buildFinancialPrompt is extremely large (500+ lines) and should be extracted separately
// For now, it remains in llmService.ts

View File

@@ -0,0 +1,78 @@
import { BaseProvider } from './baseProvider';
import type { LLMRequest, LLMResponse } from '../../llmService';
import { logger } from '../../../utils/logger';
import { config } from '../../../config/env';
/**
 * LLM provider backed by the Anthropic Messages API.
 *
 * The SDK is imported lazily inside call() so the dependency is only loaded
 * when this provider is actually used. Failures are reported through the
 * LLMResponse envelope (success: false) rather than thrown; rate-limit
 * errors are additionally logged with their retry-after hint before the
 * generic error logging.
 */
export class AnthropicProvider extends BaseProvider {
  /**
   * Execute one message-completion call against Anthropic.
   * Request-level model/maxTokens/temperature override the provider defaults.
   */
  async call(request: LLMRequest): Promise<LLMResponse> {
    try {
      // Lazy-load the SDK so it is only pulled in when this provider runs.
      const { default: Anthropic } = await import('@anthropic-ai/sdk');
      // Give the SDK a slightly longer timeout than our configured budget so
      // our own higher-level timeout handling fires first.
      const configuredTimeoutMs = config.llm.timeoutMs || 180000;
      const client = new Anthropic({
        apiKey: this.apiKey,
        timeout: configuredTimeoutMs + 10000,
      });
      const chosenModel = request.model || this.defaultModel;
      const response = await client.messages.create({
        model: chosenModel,
        max_tokens: request.maxTokens || this.maxTokens,
        temperature: request.temperature === undefined ? this.temperature : request.temperature,
        system: request.systemPrompt || '',
        messages: [
          {
            role: 'user',
            content: request.prompt,
          },
        ],
      });
      // Only the first content block is consumed; non-text blocks yield ''.
      const firstBlock = response.content[0];
      const content = firstBlock?.type === 'text' ? firstBlock.text : '';
      const usage = response.usage
        ? {
            promptTokens: response.usage.input_tokens,
            completionTokens: response.usage.output_tokens,
            totalTokens: response.usage.input_tokens + response.usage.output_tokens,
          }
        : undefined;
      return {
        success: true,
        content,
        usage,
      };
    } catch (error: any) {
      // Detect rate limiting across the shapes the SDK may surface it in
      // (HTTP status, typed API error, or message text).
      const rateLimited =
        error?.status === 429 ||
        error?.error?.type === 'rate_limit_error' ||
        error?.message?.includes('rate limit') ||
        error?.message?.includes('429');
      if (rateLimited) {
        const retryAfter =
          error?.headers?.['retry-after'] ||
          error?.error?.retry_after ||
          '60';
        logger.warn('Anthropic rate limit hit', {
          retryAfter,
          model: request.model || this.defaultModel
        });
      }
      logger.error('Anthropic API call failed', {
        error: error instanceof Error ? error.message : String(error),
        status: error?.status,
        model: request.model || this.defaultModel
      });
      return {
        success: false,
        content: '',
        error: error instanceof Error ? error.message : String(error),
      };
    }
  }
}

View File

@@ -0,0 +1,34 @@
// Import types from main llmService file
import type { LLMRequest, LLMResponse } from '../../llmService';
/**
 * Base interface for LLM providers.
 * A provider turns a normalized LLMRequest into an LLMResponse envelope.
 */
export interface ILLMProvider {
  call(request: LLMRequest): Promise<LLMResponse>;
}

/**
 * Base provider class holding the configuration shared by all providers:
 * API credentials and default generation settings. Subclasses implement
 * call() against their specific vendor SDK/API, using these defaults when
 * the request does not override them.
 *
 * Uses TypeScript parameter properties to declare and assign the fields in
 * one place, replacing the previous field-declaration + assignment
 * boilerplate. The constructor signature is unchanged.
 */
export abstract class BaseProvider implements ILLMProvider {
  constructor(
    protected apiKey: string,
    protected defaultModel: string,
    protected maxTokens: number,
    protected temperature: number
  ) {}

  /** Execute one LLM call; implemented per vendor. */
  abstract call(request: LLMRequest): Promise<LLMResponse>;
}

View File

@@ -0,0 +1,69 @@
import { BaseProvider } from './baseProvider';
import type { LLMRequest, LLMResponse } from '../../llmService';
import { logger } from '../../../utils/logger';
import { config } from '../../../config/env';
/**
 * LLM provider backed by the OpenAI Chat Completions API.
 *
 * The SDK is imported lazily inside call() so the dependency is only loaded
 * when this provider is actually used. Failures are reported through the
 * LLMResponse envelope (success: false) rather than thrown.
 */
export class OpenAIProvider extends BaseProvider {
  /**
   * Execute one chat completion against OpenAI.
   * Request-level model/maxTokens/temperature override the provider defaults.
   */
  async call(request: LLMRequest): Promise<LLMResponse> {
    try {
      // Lazy-load the SDK so it is only pulled in when this provider runs.
      const { default: OpenAI } = await import('openai');
      // Give the SDK a slightly longer timeout than our configured budget so
      // our own higher-level timeout handling fires first.
      const configuredTimeoutMs = config.llm.timeoutMs || 180000;
      const client = new OpenAI({
        apiKey: this.apiKey,
        timeout: configuredTimeoutMs + 10000,
      });
      // Build the chat transcript: optional system message, then user prompt.
      const messages: any[] = request.systemPrompt
        ? [
            { role: 'system', content: request.systemPrompt },
            { role: 'user', content: request.prompt },
          ]
        : [{ role: 'user', content: request.prompt }];
      const completion = await client.chat.completions.create({
        model: request.model || this.defaultModel,
        messages,
        max_tokens: request.maxTokens || this.maxTokens,
        temperature: request.temperature === undefined ? this.temperature : request.temperature,
      });
      const content = completion.choices[0]?.message?.content || '';
      const usage = completion.usage
        ? {
            promptTokens: completion.usage.prompt_tokens,
            completionTokens: completion.usage.completion_tokens,
            totalTokens: completion.usage.total_tokens,
          }
        : undefined;
      return {
        success: true,
        content,
        usage,
      };
    } catch (error) {
      logger.error('OpenAI API call failed', {
        error: error instanceof Error ? error.message : String(error),
        model: request.model || this.defaultModel
      });
      return {
        success: false,
        content: '',
        error: error instanceof Error ? error.message : String(error),
      };
    }
  }
}

View File

@@ -0,0 +1,195 @@
import { BaseProvider } from './baseProvider';
import type { LLMRequest, LLMResponse } from '../../llmService';
import { logger } from '../../../utils/logger';
import { config } from '../../../config/env';
/**
 * OpenRouter API provider implementation.
 *
 * Calls the OpenRouter chat-completions endpoint directly over axios rather
 * than a vendor SDK. Anthropic-style model names are translated to
 * OpenRouter's "anthropic/..." identifiers, and an optional BYOK
 * (bring-your-own-key) mode forwards our Anthropic API key for anthropic/*
 * models so usage bills against that key.
 *
 * Timeout strategy: the overall budget comes from config.llm.timeoutMs
 * (default 360000 ms); the request is aborted 10s BEFORE that budget via an
 * AbortController so this layer fails first, ahead of any upstream watchdog.
 */
export class OpenRouterProvider extends BaseProvider {
  /**
   * Execute one chat completion against OpenRouter.
   *
   * Returns a success envelope with content/usage, or { success: false,
   * error } on generic failures.
   * NOTE(review): rate-limit (429) and timeout failures are *thrown* instead
   * of returned, unlike other errors — presumably so an upstream retry loop
   * can catch them; confirm callers expect this asymmetry.
   */
  async call(request: LLMRequest): Promise<LLMResponse> {
    const startTime = Date.now();
    // NOTE(review): requestSentTime is assigned below but never read; either
    // fold it into the timing logs or remove it.
    let requestSentTime: number | null = null;
    const timeoutMs = config.llm.timeoutMs || 360000;
    // Abort 10s inside the configured budget so we time out before a proxy does.
    const abortTimeoutMs = timeoutMs - 10000;
    try {
      const axios = await import('axios');
      const model = request.model || this.defaultModel;
      const useBYOK = config.llm.openrouterUseBYOK;
      // Map Anthropic model names to OpenRouter format ("anthropic/...").
      // Branch order matters: the sonnet+"4" / haiku+"4" checks also match
      // "4.5" names, so the later explicit "4.5" branches are effectively
      // unreachable — harmless today because they map to the same targets,
      // but keep in mind when adding new model generations.
      let openRouterModel = model;
      if (model.includes('claude')) {
        if (model.includes('sonnet') && model.includes('4')) {
          openRouterModel = 'anthropic/claude-sonnet-4.5';
        } else if (model.includes('haiku') && (model.includes('4-5') || model.includes('4.5'))) {
          openRouterModel = 'anthropic/claude-haiku-4.5';
        } else if (model.includes('haiku') && model.includes('4')) {
          openRouterModel = 'anthropic/claude-haiku-4.5';
        } else if (model.includes('opus') && model.includes('4')) {
          openRouterModel = 'anthropic/claude-opus-4';
        } else if (model.includes('sonnet') && (model.includes('4.5') || model.includes('4-5'))) {
          openRouterModel = 'anthropic/claude-sonnet-4.5';
        } else if (model.includes('sonnet') && model.includes('3.7')) {
          openRouterModel = 'anthropic/claude-3.7-sonnet';
        } else if (model.includes('sonnet') && model.includes('3.5')) {
          openRouterModel = 'anthropic/claude-3.5-sonnet';
        } else if (model.includes('haiku') && model.includes('3.5')) {
          openRouterModel = 'anthropic/claude-3.5-haiku';
        } else if (model.includes('haiku') && model.includes('3')) {
          openRouterModel = 'anthropic/claude-3-haiku';
        } else if (model.includes('opus') && model.includes('3')) {
          openRouterModel = 'anthropic/claude-3-opus';
        } else {
          // Unknown claude variant: pass through under the anthropic/ prefix.
          openRouterModel = `anthropic/${model}`;
        }
      }
      const headers: Record<string, string> = {
        'Authorization': `Bearer ${this.apiKey}`,
        'Content-Type': 'application/json',
        // OpenRouter attribution headers identifying the calling app.
        'HTTP-Referer': 'https://cim-summarizer-testing.firebaseapp.com',
        'X-Title': 'CIM Summarizer',
      };
      // BYOK: forward our own Anthropic key for anthropic/* models. Fail fast
      // if the mode is enabled without the key configured.
      if (useBYOK && openRouterModel.includes('anthropic/')) {
        if (!config.llm.anthropicApiKey) {
          throw new Error('BYOK enabled but ANTHROPIC_API_KEY is not set');
        }
        headers['X-Anthropic-Api-Key'] = config.llm.anthropicApiKey;
        logger.info('Using BYOK with Anthropic API key', {
          hasKey: !!config.llm.anthropicApiKey,
          keyLength: config.llm.anthropicApiKey?.length || 0
        });
      }
      logger.info('Making OpenRouter API call', {
        model: openRouterModel,
        originalModel: model,
        useBYOK,
        timeout: timeoutMs,
        promptLength: request.prompt.length,
        systemPromptLength: request.systemPrompt?.length || 0,
      });
      // Manual abort timer: fires at abortTimeoutMs (budget minus 10s) and
      // cancels the in-flight axios request via the shared signal.
      const abortController = new AbortController();
      const timeoutId = setTimeout(() => {
        logger.error('OpenRouter request timeout - aborting', {
          elapsedMs: Date.now() - startTime,
          timeoutMs,
          abortTimeoutMs,
        });
        abortController.abort();
      }, abortTimeoutMs);
      try {
        requestSentTime = Date.now();
        const requestBody = {
          model: openRouterModel,
          // Optional system message first, then the user prompt.
          messages: [
            ...(request.systemPrompt ? [{
              role: 'system',
              content: request.systemPrompt
            }] : []),
            {
              role: 'user',
              content: request.prompt
            }
          ],
          max_tokens: request.maxTokens || this.maxTokens,
          temperature: request.temperature !== undefined ? request.temperature : this.temperature,
        };
        const response = await axios.default.post(
          'https://openrouter.ai/api/v1/chat/completions',
          requestBody,
          {
            headers,
            // axios's own timeout is kept slightly behind the abort timer so
            // the AbortController is the primary cancellation path.
            timeout: abortTimeoutMs + 1000,
            signal: abortController.signal,
            // Resolve (don't reject) on 4xx so we can surface the API's own
            // error message below; only 5xx rejects.
            validateStatus: (status) => status < 500,
          }
        );
        clearTimeout(timeoutId);
        if (response.status >= 400) {
          logger.error('OpenRouter API error', {
            status: response.status,
            error: response.data?.error || response.data,
          });
          throw new Error(response.data?.error?.message || `OpenRouter API error: HTTP ${response.status}`);
        }
        const content = response.data?.choices?.[0]?.message?.content || '';
        // NOTE(review): response.data is optional-chained for choices but not
        // here; if data were ever undefined this line would throw (it is
        // caught below and converted to a failure envelope).
        const usage = response.data.usage ? {
          promptTokens: response.data.usage.prompt_tokens || 0,
          completionTokens: response.data.usage.completion_tokens || 0,
          totalTokens: response.data.usage.total_tokens || 0,
        } : undefined;
        logger.info('OpenRouter API call successful', {
          model: openRouterModel,
          usage,
          responseLength: content.length,
          totalTimeMs: Date.now() - startTime,
        });
        return {
          success: true,
          content,
          usage,
        };
      } catch (axiosError: any) {
        clearTimeout(timeoutId);
        // Normalize abort/timeout shapes (fetch-style AbortError, axios
        // ECONNABORTED, or our own signal) into one descriptive error.
        if (axiosError.name === 'AbortError' || axiosError.code === 'ECONNABORTED' || abortController.signal.aborted) {
          const totalTime = Date.now() - startTime;
          logger.error('OpenRouter request was aborted (timeout)', {
            totalTimeMs: totalTime,
            timeoutMs,
            abortTimeoutMs,
          });
          throw new Error(`OpenRouter API request timed out after ${Math.round(totalTime / 1000)}s`);
        }
        throw axiosError;
      }
    } catch (error: any) {
      // Rate-limit detection across HTTP status, API error payload, and
      // message text; rethrown (not returned) so callers can schedule a retry.
      const isRateLimit = error?.response?.status === 429 ||
        error?.response?.data?.error?.message?.includes('rate limit') ||
        error?.message?.includes('rate limit') ||
        error?.message?.includes('429');
      if (isRateLimit) {
        const retryAfter = error?.response?.headers?.['retry-after'] ||
          error?.response?.data?.error?.retry_after ||
          '60';
        logger.error('OpenRouter API rate limit error (429)', {
          error: error?.response?.data?.error || error?.message,
          retryAfter,
        });
        throw new Error(`OpenRouter API rate limit exceeded. Retry after ${retryAfter} seconds.`);
      }
      logger.error('OpenRouter API error', {
        error: error?.response?.data || error?.message,
        status: error?.response?.status,
        code: error?.code,
      });
      return {
        success: false,
        content: '',
        error: error?.response?.data?.error?.message || error?.message || 'Unknown error',
      };
    }
  }
}

View File

@@ -0,0 +1,112 @@
/**
 * CIM System Prompt Builder.
 *
 * Produces the system prompt for full CIM document analysis. When
 * focusedFields is provided (non-empty), a "priority areas" preamble is
 * injected immediately after the opening paragraph so a multi-pass caller can
 * steer the model toward specific template fields while still requiring the
 * complete template to be filled.
 *
 * @param focusedFields optional list of template field names to emphasize
 * @returns the complete system prompt string
 */
export function getCIMSystemPrompt(focusedFields?: string[]): string {
  let focusInstruction = '';
  if (focusedFields && focusedFields.length > 0) {
    const bulletList = focusedFields.map((field) => `- ${field}`).join('\n');
    focusInstruction =
      '\n\nPRIORITY AREAS FOR THIS PASS (extract these thoroughly, but still extract ALL other fields):\n' +
      bulletList +
      '\n\nFor this pass, prioritize extracting the fields listed above with extra thoroughness. However, you MUST still extract ALL fields in the template. Do NOT use "Not specified in CIM" for any field unless you have thoroughly searched the entire document and confirmed the information is truly not present. Be especially thorough in extracting all nested fields within the priority areas.';
  }
  return `You are a world-class private equity investment analyst at BPCP (Blue Point Capital Partners), operating at the analytical depth and rigor of top-tier PE firms (KKR, Blackstone, Apollo, Carlyle). Your task is to analyze Confidential Information Memorandums (CIMs) with the precision, depth, and strategic insight expected by BPCP's investment committee. Return a comprehensive, structured JSON object that follows the BPCP CIM Review Template format EXACTLY.${focusInstruction}
CRITICAL REQUIREMENTS:
1. **JSON OUTPUT ONLY**: Your entire response MUST be a single, valid JSON object. Do not include any text or explanation before or after the JSON object.
2. **BPCP TEMPLATE FORMAT**: The JSON object MUST follow the BPCP CIM Review Template structure exactly as specified.
3. **COMPLETE ALL FIELDS**: You MUST provide a value for every field. Use "Not specified in CIM" for any information that is not available in the document.
4. **NO PLACEHOLDERS**: Do not use placeholders like "..." or "TBD". Use "Not specified in CIM" instead.
5. **PROFESSIONAL ANALYSIS**: The content should be high-quality and suitable for BPCP's investment committee.
6. **BPCP FOCUS**: Focus on companies in 5+MM EBITDA range in consumer and industrial end markets, with emphasis on M&A, technology & data usage, supply chain and human capital optimization.
7. **BPCP PREFERENCES**: BPCP prefers companies which are founder/family-owned and within driving distance of Cleveland and Charlotte.
8. **EXACT FIELD NAMES**: Use the exact field names and descriptions from the BPCP CIM Review Template.
9. **FINANCIAL DATA**: For financial metrics, use actual numbers if available, otherwise use "Not specified in CIM".
10. **VALID JSON**: Ensure your response is valid JSON that can be parsed without errors.
FINANCIAL VALIDATION FRAMEWORK:
Before finalizing any financial extraction, you MUST perform these validation checks:
**Magnitude Validation**:
- Revenue should typically be $10M+ for target companies (if less, verify you're using the PRIMARY table, not a subsidiary)
- EBITDA should typically be $1M+ and positive for viable targets
- If FY-3 revenue is $64M, FY-2 should be similar magnitude (e.g., $50M-$90M), not $2.9M or $10 - this indicates column misalignment
**Trend Validation**:
- Revenue should generally increase or be stable year-over-year (FY-3 → FY-2 → FY-1)
- Large sudden drops (>50%) or increases (>200%) may indicate misaligned columns or wrong table
- EBITDA should follow similar trends to revenue (unless margin expansion/contraction is explicitly explained)
**Cross-Period Consistency**:
- If FY-3 revenue = $64M and FY-2 revenue = $71M, growth should be ~11% (not 1000% or -50%)
- Margins should be relatively stable across periods (within 10-15 percentage points unless explained)
- EBITDA margins should be 5-50% (typical range), gross margins 20-80%
**Multi-Table Cross-Reference**:
- Cross-reference primary table with executive summary financial highlights
- Verify consistency between detailed financials and summary tables
- Check appendices for additional financial detail or adjustments
- If discrepancies exist, note them and use the most authoritative source (typically the detailed historical table)
**Calculation Validation**:
- Verify revenue growth percentages match: ((Current - Prior) / Prior) * 100
- Verify margins match: (Metric / Revenue) * 100
- If calculations don't match, use the explicitly stated values from the table
PE INVESTOR PERSONA & METHODOLOGY:
You operate with the analytical rigor and strategic depth of top-tier private equity firms. Your analysis should demonstrate:
**Value Creation Focus**:
- Identify specific, quantifiable value creation opportunities (e.g., "Margin expansion of 200-300 bps through pricing optimization and cost reduction, potentially adding $2-3M EBITDA")
- Assess operational improvement potential (supply chain, technology, human capital)
- Evaluate M&A and add-on acquisition potential with specific rationale
- Quantify potential impact where possible (EBITDA improvement, revenue growth, multiple expansion)
**Risk Assessment Depth**:
- Categorize risks by type: operational, financial, market, execution, regulatory, technology
- Assess both probability and impact (high/medium/low)
- Identify mitigating factors and management's risk management approach
- Distinguish between deal-breakers and manageable risks
**Strategic Analysis Frameworks**:
- **Porter's Five Forces**: Assess competitive intensity, supplier power, buyer power, threat of substitutes, threat of new entrants
- **SWOT Analysis**: Synthesize strengths, weaknesses, opportunities, threats from the CIM
- **Value Creation Playbook**: Revenue growth (organic/inorganic), margin expansion, operational improvements, multiple expansion
- **Comparable Analysis**: Reference industry benchmarks, comparable company multiples, recent transaction multiples where mentioned
**Industry Context Integration**:
- Reference industry-specific metrics and benchmarks (e.g., SaaS: ARR growth, churn, CAC payback; Manufacturing: inventory turns, days sales outstanding)
- Consider sector-specific risks and opportunities (regulatory changes, technology disruption, consolidation trends)
- Evaluate market position relative to industry standards (market share, growth vs market, margin vs peers)
COMMON MISTAKES TO AVOID:
1. **Subsidiary vs Parent Table Confusion**: Primary table shows values in millions ($64M), subsidiary tables show thousands ($20,546). Always use the PRIMARY table.
2. **Column Misalignment**: Count columns carefully - ensure values align with their period columns. Verify trends make sense.
3. **Projections vs Historical**: Ignore tables marked with "E", "P", "PF", "Projected", "Forecast" - only extract historical data.
4. **Unit Confusion**: "$20,546 (in thousands)" = $20.5M, not $20,546M. Always check table footnotes for units.
5. **Missing Cross-Validation**: Don't extract financials in isolation - cross-reference with executive summary, narrative text, appendices.
6. **Generic Analysis**: Avoid generic statements like "strong management team" - provide specific details (years of experience, track record, specific achievements).
7. **Incomplete Risk Assessment**: Don't just list risks - assess impact, probability, and mitigations. Categorize by type.
8. **Vague Value Creation**: Instead of "operational improvements", specify "reduce SG&A by 150 bps through shared services consolidation, adding $1.5M EBITDA".
ANALYSIS QUALITY REQUIREMENTS:
- **Financial Precision**: Extract exact financial figures, percentages, and growth rates. Calculate CAGR where possible. Validate all calculations.
- **Competitive Intelligence**: Identify specific competitors with market share context, competitive positioning (leader/follower/niche), and differentiation drivers.
- **Risk Assessment**: Evaluate both stated and implied risks, categorize by type, assess impact and probability, identify mitigations.
- **Growth Drivers**: Identify specific revenue growth drivers with quantification (e.g., "New product line launched in 2023, contributing $5M revenue in FY-1").
- **Management Quality**: Assess management experience with specific details (years in role, prior companies, track record), evaluate retention risk and succession planning.
- **Value Creation**: Identify specific value creation levers with quantification guidance (e.g., "Pricing optimization: 2-3% price increase on 60% of revenue base = $1.8-2.7M revenue increase").
- **Due Diligence Focus**: Highlight areas requiring deeper investigation, prioritize by investment decision impact (deal-breakers vs nice-to-know).
- **Key Questions Detail**: Provide detailed, contextual questions (2-3 sentences each) explaining why each question matters for the investment decision.
- **Investment Thesis Detail**: Provide comprehensive analysis with specific examples, quantification where possible, and strategic rationale. Each item should include: what, why it matters, quantification if possible, investment impact.
DOCUMENT ANALYSIS APPROACH:
- Read the entire document systematically, paying special attention to financial tables, charts, appendices, and footnotes
- Cross-reference information across different sections for consistency (executive summary vs detailed sections vs appendices)
- Extract both explicit statements and implicit insights (read between the lines for risks, opportunities, competitive position)
- Focus on quantitative data while providing qualitative context and strategic interpretation
- Identify any inconsistencies or areas requiring clarification (note discrepancies and their potential significance)
- Consider industry context and market dynamics when evaluating opportunities and risks (benchmark against industry standards)
- Use document structure (headers, sections, page numbers) to locate and validate information
- Check footnotes for adjustments, definitions, exclusions, and important context
`;
}

View File

@@ -0,0 +1,14 @@
/**
 * LLM Prompt Builders
 * Centralized exports for all prompt builders.
 *
 * Note: most prompt templates are very large; this index re-exports builders
 * as they are extracted from llmService.ts. The remaining builders (e.g. the
 * very large buildFinancialPrompt) still live in llmService.ts and will be
 * re-exported from here once modularized.
 */
export { getCIMSystemPrompt } from './cimSystemPrompt';

View File

@@ -0,0 +1,38 @@
/**
* Base LLM Provider Interface
* Defines the contract for all LLM provider implementations
*/
import { LLMRequest, LLMResponse } from '../../types/llm';
/**
 * Base interface for LLM providers.
 * A provider turns a normalized LLMRequest into an LLMResponse envelope.
 */
export interface ILLMProvider {
  call(request: LLMRequest): Promise<LLMResponse>;
}

/**
 * Base provider class holding the configuration shared by all providers:
 * API credentials and default generation settings. Subclasses implement
 * call() against their specific vendor SDK/API, using these defaults when
 * the request does not override them.
 *
 * Uses TypeScript parameter properties to declare and assign the fields in
 * one place, replacing the previous field-declaration + assignment
 * boilerplate. The constructor signature is unchanged.
 */
export abstract class BaseLLMProvider implements ILLMProvider {
  constructor(
    protected apiKey: string,
    protected defaultModel: string,
    protected maxTokens: number,
    protected temperature: number
  ) {}

  /** Execute one LLM call; implemented per vendor. */
  abstract call(request: LLMRequest): Promise<LLMResponse>;
}

View File

@@ -0,0 +1,11 @@
/**
 * LLM Provider Exports
 * Centralized exports for all LLM provider implementations.
 *
 * Only the base provider contract is exported so far; concrete provider
 * implementations remain in llmService.ts and will be re-exported here once
 * extracted.
 */
export type { ILLMProvider } from './baseProvider';
export { BaseLLMProvider } from './baseProvider';

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,15 @@
/**
* Cost Calculation Utilities
* Estimates LLM API costs based on token usage and model
*/
import { estimateLLMCost } from '../../config/constants';
/**
 * Estimate the dollar cost of an LLM call for a given token count and model.
 * Pure delegation to the centralized rate table in config/constants so
 * pricing stays defined in exactly one place.
 *
 * @param tokens total token count to price
 * @param model  model identifier used to look up the per-token rate
 * @returns estimated cost (same unit as the centralized rate table)
 */
export function estimateCost(tokens: number, model: string): number {
  return estimateLLMCost(tokens, model);
}

View File

@@ -0,0 +1,9 @@
/**
 * LLM Utility Functions
 * Centralized exports for all LLM utility functions:
 * - extractJsonFromResponse: robust JSON extraction from raw LLM output
 * - estimateTokenCount / truncateText: token estimation and budget-aware truncation
 * - estimateCost: token-based cost estimation
 */
export { extractJsonFromResponse } from './jsonExtractor';
export { estimateTokenCount, truncateText } from './tokenEstimator';
export { estimateCost } from './costCalculator';

View File

@@ -0,0 +1,184 @@
/**
* JSON Extraction Utilities
* Extracts JSON from LLM responses, handling various formats and edge cases
*/
import { logger } from '../../utils/logger';
// NOTE(review): the cost/token imports below are unused in this module —
// likely left over from the extraction out of llmService.ts; candidates for
// removal in a follow-up.
import { LLM_COST_RATES, DEFAULT_COST_RATE, estimateLLMCost, estimateTokenCount } from '../../config/constants';
/**
 * Extract JSON from LLM response content.
 *
 * Tries progressively weaker strategies, in order:
 *   1. A fenced ```json block, located by index and trimmed with brace
 *      matching to isolate the root object (tolerates missing closing fence).
 *   2. Regex extraction of ```json or bare ``` fenced blocks.
 *   3. Brace matching from the first '{' in the raw content.
 *   4. Truncation recovery: salvage the last complete object/pair from a
 *      response cut off by the token limit, or fail with a message advising
 *      a higher maxTokens.
 *
 * NOTE(review): the brace counters do not account for '{'/'}' characters
 * inside JSON string values; a skewed count falls through to the later
 * strategies (or fails with a descriptive error) rather than returning
 * wrong data silently.
 *
 * @param content raw LLM response text
 * @returns the parsed JSON value
 * @throws Error when no valid JSON can be recovered (including truncation)
 */
export function extractJsonFromResponse(content: string): any {
  try {
    // --- Strategy 1: fenced ```json block, located by index ---
    const jsonBlockStart = content.indexOf('```json');
    logger.info('JSON extraction - checking for ```json block', {
      jsonBlockStart,
      hasJsonBlock: jsonBlockStart !== -1,
      contentLength: content.length,
      contentEnds: content.substring(content.length - 50),
    });
    if (jsonBlockStart !== -1) {
      // Content starts on the line after the opening fence. If there is no
      // newline, this evaluates to 0 and the guard below skips the strategy.
      const jsonContentStart = content.indexOf('\n', jsonBlockStart) + 1;
      let closingBackticks = -1;
      // Try to find \n``` first (most common)
      const newlineBackticks = content.indexOf('\n```', jsonContentStart);
      if (newlineBackticks !== -1) {
        closingBackticks = newlineBackticks + 1;
      } else {
        // Fallback: look for ``` at the very end
        if (content.endsWith('```')) {
          closingBackticks = content.length - 3;
        } else {
          // No closing fence at all (e.g. truncated response): take the rest.
          closingBackticks = content.length;
          logger.warn('LLM response has no closing backticks, using entire content');
        }
      }
      logger.info('JSON extraction - found block boundaries', {
        jsonContentStart,
        closingBackticks,
        newlineBackticks,
        contentEndsWithBackticks: content.endsWith('```'),
        isValid: closingBackticks > jsonContentStart,
      });
      if (jsonContentStart > 0 && closingBackticks > jsonContentStart) {
        const jsonStr = content.substring(jsonContentStart, closingBackticks).trim();
        logger.info('JSON extraction - extracted string', {
          jsonStrLength: jsonStr.length,
          startsWithBrace: jsonStr.startsWith('{'),
          jsonStrPreview: jsonStr.substring(0, 300),
        });
        if (jsonStr && jsonStr.startsWith('{')) {
          try {
            // Use brace matching to get the complete root object, so trailing
            // prose inside the fence does not break JSON.parse.
            let braceCount = 0;
            let rootEndIndex = -1;
            for (let i = 0; i < jsonStr.length; i++) {
              if (jsonStr[i] === '{') braceCount++;
              else if (jsonStr[i] === '}') {
                braceCount--;
                if (braceCount === 0) {
                  rootEndIndex = i;
                  break;
                }
              }
            }
            if (rootEndIndex !== -1) {
              const completeJsonStr = jsonStr.substring(0, rootEndIndex + 1);
              logger.info('Brace matching succeeded', {
                originalLength: jsonStr.length,
                extractedLength: completeJsonStr.length,
                extractedPreview: completeJsonStr.substring(0, 200),
              });
              return JSON.parse(completeJsonStr);
            } else {
              logger.warn('Brace matching failed to find closing brace', {
                jsonStrLength: jsonStr.length,
                jsonStrPreview: jsonStr.substring(0, 500),
              });
            }
          } catch (e) {
            // Parse failure inside the fence is non-fatal; later strategies
            // may still recover something usable.
            logger.error('Brace matching threw error, falling back to regex', {
              error: e instanceof Error ? e.message : String(e),
              stack: e instanceof Error ? e.stack : undefined,
            });
          }
        }
      }
    }
    // --- Strategy 2: regex extraction of fenced blocks ---
    logger.warn('Using fallback regex extraction');
    const jsonMatch = content.match(/```json\n([\s\S]+)\n```/);
    if (jsonMatch && jsonMatch[1]) {
      logger.info('Regex extraction found JSON', {
        matchLength: jsonMatch[1].length,
        matchPreview: jsonMatch[1].substring(0, 200),
      });
      return JSON.parse(jsonMatch[1]);
    }
    // Try to find JSON within ``` ... ``` (fence without a language tag)
    const codeBlockMatch = content.match(/```\n([\s\S]*?)\n```/);
    if (codeBlockMatch && codeBlockMatch[1]) {
      return JSON.parse(codeBlockMatch[1]);
    }
    // --- Strategy 3: bare object — brace matching from the first '{' ---
    const startIndex = content.indexOf('{');
    if (startIndex === -1) {
      throw new Error('No JSON object found in response');
    }
    // Try to find the complete JSON object by matching braces
    let braceCount = 0;
    let endIndex = -1;
    for (let i = startIndex; i < content.length; i++) {
      if (content[i] === '{') {
        braceCount++;
      } else if (content[i] === '}') {
        braceCount--;
        if (braceCount === 0) {
          endIndex = i;
          break;
        }
      }
    }
    if (endIndex === -1) {
      // --- Strategy 4: truncation recovery ---
      // No balanced root object: the response was likely cut off mid-output.
      const partialJson = content.substring(startIndex);
      const openBraces = (partialJson.match(/{/g) || []).length;
      const closeBraces = (partialJson.match(/}/g) || []).length;
      const isTruncated = openBraces > closeBraces;
      logger.warn('Attempting to recover from truncated JSON response', {
        contentLength: content.length,
        partialJsonLength: partialJson.length,
        openBraces,
        closeBraces,
        isTruncated,
        endsAbruptly: !content.trim().endsWith('}') && !content.trim().endsWith('```')
      });
      // If clearly truncated (more open than close braces), throw a specific error
      if (isTruncated && openBraces - closeBraces > 2) {
        throw new Error(`Response was truncated due to token limit. Expected ${openBraces - closeBraces} more closing braces. Increase maxTokens limit.`);
      }
      // Try to find the last complete object or array
      const lastCompleteMatch = partialJson.match(/(\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\})/);
      if (lastCompleteMatch && lastCompleteMatch[1]) {
        return JSON.parse(lastCompleteMatch[1]);
      }
      // If that fails, try to find the last complete key-value pair
      const lastPairMatch = partialJson.match(/(\{[^{}]*"[^"]*"\s*:\s*"[^"]*"[^{}]*\})/);
      if (lastPairMatch && lastPairMatch[1]) {
        return JSON.parse(lastPairMatch[1]);
      }
      throw new Error(`Unable to extract valid JSON from truncated response. Response appears incomplete (${openBraces} open braces, ${closeBraces} close braces). Increase maxTokens limit.`);
    }
    const jsonString = content.substring(startIndex, endIndex + 1);
    return JSON.parse(jsonString);
  } catch (error) {
    logger.error('Failed to extract JSON from LLM response', {
      error,
      contentLength: content.length,
      contentPreview: content.substring(0, 1000)
    });
    throw new Error(`JSON extraction failed: ${error instanceof Error ? error.message : 'Unknown error'}`);
  }
}

View File

@@ -0,0 +1,56 @@
/**
* Token Estimation Utilities
* Estimates token counts and handles text truncation
*/
import { estimateTokenCount as estimateTokens, TOKEN_ESTIMATION } from '../../config/constants';
/**
 * Estimate the number of tokens in a piece of text.
 *
 * Thin wrapper around the shared estimator exported from config/constants,
 * so every caller applies the same heuristic.
 */
export function estimateTokenCount(text: string): number {
  // Delegate rather than duplicating the heuristic here.
  return estimateTokens(text);
}
/**
 * Truncate text to fit within a token limit while preserving sentence
 * boundaries where possible.
 *
 * The token budget is converted to characters via
 * TOKEN_ESTIMATION.CHARS_PER_TOKEN, so the limit is approximate.
 *
 * @param text - Text to truncate.
 * @param maxTokens - Approximate token budget the result must fit in.
 * @returns The original text when it already fits; otherwise a truncated copy
 *          ending at a sentence boundary, a word boundary, or a hard
 *          character cut (in that order of preference).
 */
export function truncateText(text: string, maxTokens: number): string {
  // Convert token limit to an approximate character limit.
  const maxChars = maxTokens * TOKEN_ESTIMATION.CHARS_PER_TOKEN;
  if (text.length <= maxChars) {
    return text;
  }
  const truncated = text.substring(0, maxChars);
  // Prefer cutting at the last sentence terminator (., !, ?) followed by
  // whitespace — but only if it lands within 95% of the limit, so we do not
  // discard too much context for the sake of a clean boundary.
  const sentenceEndRegex = /[.!?]\s+/g;
  let lastMatch: RegExpExecArray | null = null;
  let match: RegExpExecArray | null;
  while ((match = sentenceEndRegex.exec(truncated)) !== null) {
    if (match.index < maxChars * 0.95) {
      lastMatch = match;
    }
  }
  if (lastMatch) {
    // Truncate at the sentence boundary.
    return text.substring(0, lastMatch.index + lastMatch[0].length).trim();
  }
  // Fallback: cut at the last word boundary if within 90% of the limit.
  // (Removed an unused `wordBoundaryRegex` local that was never applied.)
  const lastSpaceIndex = truncated.lastIndexOf(' ');
  if (lastSpaceIndex > maxChars * 0.9) {
    return text.substring(0, lastSpaceIndex).trim();
  }
  // Final fallback: hard character cut.
  return truncated.trim();
}

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,606 @@
import { logger } from '../utils/logger';
import { llmService } from './llmService';
import { CIMReview } from './llmSchemas';
import { financialExtractionMonitoringService } from './financialExtractionMonitoringService';
import { defaultCIMReview } from './unifiedDocumentProcessor';
// Use the same ProcessingResult interface as other processors
/**
 * Outcome of a full document-processing run. Shared shape across processor
 * implementations so callers can treat them interchangeably.
 */
interface ProcessingResult {
  success: boolean;
  summary: string;
  analysisData: CIMReview;
  // Which pipeline produced this result (used for logging/analytics).
  processingStrategy: 'parallel_sections' | 'simple_full_document' | 'document_ai_agentic_rag';
  // Wall-clock milliseconds (measured via Date.now() deltas).
  processingTime: number;
  // Total upstream API calls made during the run.
  apiCalls: number;
  // Set when success is false; explicitly undefined on success.
  error: string | undefined;
}
/**
 * Result of extracting a single CIM section.
 */
interface SectionExtractionResult {
  // Logical section name, e.g. 'financial', 'dealOverview'.
  section: string;
  success: boolean;
  // Partial review data merged into the final CIMReview when successful.
  data: Partial<CIMReview>;
  error?: string;
  apiCalls: number;
  // Milliseconds spent on this section.
  processingTime: number;
}
/**
 * Parallel Document Processor
 *
 * Strategy: extract independent CIM sections in parallel to reduce wall-clock
 * processing time:
 * - Financial extraction (already optimized with Haiku)
 * - Deal overview
 * - Business description
 * - Market analysis
 * - Management team
 * - Investment thesis
 *
 * Safety features:
 * - Rate limit risk checking before parallel execution
 * - Automatic fallback to sequential processing if risk is high
 * - API call tracking to prevent exceeding limits
 */
class ParallelDocumentProcessor {
  // Limit parallel API calls (Anthropic has concurrent connection limits).
  private readonly MAX_CONCURRENT_EXTRACTIONS = 2;
  // NOTE(review): documented as "fallback to sequential if risk >= medium",
  // but processDocument() only falls back when the risk is 'high' and this
  // constant is never read. Kept unchanged to preserve behavior — confirm
  // the intended threshold before wiring it into the check.
  private readonly RATE_LIMIT_RISK_THRESHOLD: 'low' | 'medium' | 'high' = 'medium';

  /**
   * Process a document by extracting its sections in parallel.
   *
   * Falls back to the simple sequential processor when rate-limit risk is
   * 'high'. Never throws: failures are reported through the returned
   * ProcessingResult's success/error fields.
   *
   * @param documentId - Document being processed (used for logging/monitoring).
   * @param userId - Owner of the document (forwarded to the fallback processor).
   * @param text - Full extracted document text.
   * @param options - Pass-through options for downstream extractors.
   */
  async processDocument(
    documentId: string,
    userId: string,
    text: string,
    options: any = {}
  ): Promise<ProcessingResult> {
    const startTime = Date.now();
    let totalApiCalls = 0;
    try {
      logger.info('Parallel processor: Starting', {
        documentId,
        textLength: text.length,
      });
      // Check rate limit risk before fanning out parallel LLM calls.
      const rateLimitRisk = await this.checkRateLimitRisk();
      if (rateLimitRisk === 'high') {
        logger.warn('High rate limit risk detected, falling back to sequential processing', {
          documentId,
          risk: rateLimitRisk,
        });
        // Lazy import avoids a circular dependency at module load time.
        const { simpleDocumentProcessor } = await import('./simpleDocumentProcessor');
        return await simpleDocumentProcessor.processDocument(documentId, userId, text, options);
      }
      // Extract sections in parallel (batched by MAX_CONCURRENT_EXTRACTIONS).
      const sections = await this.extractSectionsInParallel(documentId, userId, text, options);
      totalApiCalls = sections.reduce((sum, s) => sum + s.apiCalls, 0);
      // Merge all section results into a single review object.
      const analysisData = this.mergeSectionResults(sections);
      // Generate a short pipe-delimited summary for display.
      const summary = this.generateSummary(analysisData);
      const processingTime = Date.now() - startTime;
      logger.info('Parallel processor: Completed', {
        documentId,
        processingTime,
        apiCalls: totalApiCalls,
        sectionsExtracted: sections.filter(s => s.success).length,
        totalSections: sections.length,
      });
      return {
        success: true,
        summary,
        analysisData: analysisData as CIMReview,
        processingStrategy: 'parallel_sections',
        processingTime,
        apiCalls: totalApiCalls,
        error: undefined,
      };
    } catch (error) {
      const processingTime = Date.now() - startTime;
      logger.error('Parallel processor: Failed', {
        documentId,
        error: error instanceof Error ? error.message : String(error),
        processingTime,
      });
      return {
        success: false,
        summary: '',
        analysisData: defaultCIMReview,
        processingStrategy: 'parallel_sections',
        processingTime,
        apiCalls: totalApiCalls,
        error: error instanceof Error ? error.message : String(error),
      };
    }
  }

  /**
   * Check rate limit risk across the models this processor uses.
   * Returns the highest reported risk; defaults to 'low' when the monitoring
   * service itself fails (so a monitoring outage does not block processing).
   */
  private async checkRateLimitRisk(): Promise<'low' | 'medium' | 'high'> {
    try {
      // Check risk for the models used by the extraction paths.
      const anthropicHaikuRisk = await financialExtractionMonitoringService.checkRateLimitRisk(
        'anthropic',
        'claude-3-5-haiku-latest'
      );
      const anthropicSonnetRisk = await financialExtractionMonitoringService.checkRateLimitRisk(
        'anthropic',
        'claude-sonnet-4-5-20250514'
      );
      // Return the highest risk of the two.
      if (anthropicHaikuRisk === 'high' || anthropicSonnetRisk === 'high') {
        return 'high';
      } else if (anthropicHaikuRisk === 'medium' || anthropicSonnetRisk === 'medium') {
        return 'medium';
      } else {
        return 'low';
      }
    } catch (error) {
      logger.warn('Failed to check rate limit risk, defaulting to low', {
        error: error instanceof Error ? error.message : String(error),
      });
      return 'low'; // Default to low risk on error
    }
  }

  /**
   * Extract all sections with bounded concurrency.
   *
   * Runs MAX_CONCURRENT_EXTRACTIONS sections at a time; if a batch hits a
   * concurrent-connection/429 error it is retried sequentially with delays.
   * Failed sections are recorded as unsuccessful results rather than thrown.
   */
  private async extractSectionsInParallel(
    documentId: string,
    userId: string,
    text: string,
    options: any
  ): Promise<SectionExtractionResult[]> {
    // The five template-driven sections share one generic extractor; only the
    // financial section has its own path (deterministic parser + Haiku).
    const sections: Array<{ name: string; extractor: () => Promise<SectionExtractionResult> }> = [
      { name: 'financial', extractor: () => this.extractFinancialSection(documentId, userId, text, options) },
      {
        name: 'dealOverview',
        extractor: () => this.extractTemplateSection(
          'dealOverview',
          'dealOverview',
          text,
          'Extract only the deal overview information: company name, industry, geography, deal source, transaction type, dates, reviewers, page count, and reason for sale.'
        ),
      },
      {
        name: 'businessDescription',
        extractor: () => this.extractTemplateSection(
          'businessDescription',
          'businessDescription',
          text,
          'Extract only the business description: core operations, products/services, value proposition, customer base, and supplier information.'
        ),
      },
      {
        name: 'marketAnalysis',
        extractor: () => this.extractTemplateSection(
          'marketAnalysis',
          'marketIndustryAnalysis',
          text,
          'Extract only the market and industry analysis: market size, growth rate, industry trends, competitive landscape, and barriers to entry.'
        ),
      },
      {
        name: 'managementTeam',
        extractor: () => this.extractTemplateSection(
          'managementTeam',
          'managementTeamOverview',
          text,
          'Extract only the management team information: key leaders, quality assessment, post-transaction intentions, and organizational structure.'
        ),
      },
      {
        name: 'investmentThesis',
        extractor: () => this.extractTemplateSection(
          'investmentThesis',
          'preliminaryInvestmentThesis',
          text,
          'Extract only the investment thesis: key attractions, potential risks, value creation levers, and alignment with BPCP fund strategy.'
        ),
      },
    ];
    // Process sections in batches to respect concurrency limits.
    const results: SectionExtractionResult[] = [];
    for (let i = 0; i < sections.length; i += this.MAX_CONCURRENT_EXTRACTIONS) {
      const batch = sections.slice(i, i + this.MAX_CONCURRENT_EXTRACTIONS);
      logger.info(`Processing batch ${Math.floor(i / this.MAX_CONCURRENT_EXTRACTIONS) + 1} of sections`, {
        documentId,
        batchSize: batch.length,
        sections: batch.map(s => s.name),
      });
      let batchResults = await Promise.allSettled(
        batch.map(section => section.extractor())
      );
      // If the provider rejected us for too many concurrent connections (or
      // returned a 429), rerun this batch sequentially with delays.
      const hasConcurrentLimitError = batchResults.some(result =>
        result.status === 'rejected' &&
        result.reason instanceof Error &&
        (result.reason.message.includes('concurrent connections') ||
         result.reason.message.includes('429'))
      );
      if (hasConcurrentLimitError) {
        logger.warn('Concurrent connection limit hit, retrying batch sequentially', {
          documentId,
          batchSize: batch.length,
        });
        batchResults = [];
        for (const section of batch) {
          try {
            const result = await section.extractor();
            batchResults.push({ status: 'fulfilled' as const, value: result });
            // Small delay between sequential calls.
            await new Promise(resolve => setTimeout(resolve, 1000));
          } catch (error) {
            batchResults.push({
              status: 'rejected' as const,
              reason: error instanceof Error ? error : new Error(String(error))
            });
          }
        }
      }
      batchResults.forEach((result, index) => {
        if (result.status === 'fulfilled') {
          results.push(result.value);
        } else {
          logger.error(`Section extraction failed: ${batch[index].name}`, {
            documentId,
            error: result.reason,
          });
          // Record the failure so merging/reporting still sees every section.
          results.push({
            section: batch[index].name,
            success: false,
            data: {},
            error: result.reason instanceof Error ? result.reason.message : String(result.reason),
            apiCalls: 0,
            processingTime: 0,
          });
        }
      });
      // Small delay between batches to respect rate limits.
      if (i + this.MAX_CONCURRENT_EXTRACTIONS < sections.length) {
        await new Promise(resolve => setTimeout(resolve, 1000));
      }
    }
    return results;
  }

  /**
   * Extract the financial section (deterministic parser first, then the
   * Haiku-optimized financials-only LLM pass).
   */
  private async extractFinancialSection(
    documentId: string,
    userId: string,
    text: string,
    options: any
  ): Promise<SectionExtractionResult> {
    const startTime = Date.now();
    try {
      // Run the deterministic table parser first; its output (when any
      // revenue figure is found) is passed to the LLM as a starting point.
      let deterministicFinancials: any = null;
      try {
        const { parseFinancialsFromText } = await import('./financialTableParser');
        const parsedFinancials = parseFinancialsFromText(text);
        const hasData = parsedFinancials.fy3?.revenue || parsedFinancials.fy2?.revenue ||
                        parsedFinancials.fy1?.revenue || parsedFinancials.ltm?.revenue;
        if (hasData) {
          deterministicFinancials = parsedFinancials;
        }
      } catch (parserError) {
        logger.debug('Deterministic parser failed in parallel extraction', {
          error: parserError instanceof Error ? parserError.message : String(parserError),
        });
      }
      const financialResult = await llmService.processFinancialsOnly(
        text,
        deterministicFinancials || undefined
      );
      const processingTime = Date.now() - startTime;
      if (financialResult.success && financialResult.jsonOutput?.financialSummary) {
        return {
          section: 'financial',
          success: true,
          data: { financialSummary: financialResult.jsonOutput.financialSummary },
          apiCalls: 1,
          processingTime,
        };
      }
      return {
        section: 'financial',
        success: false,
        data: {},
        error: financialResult.error,
        apiCalls: 1,
        processingTime,
      };
    } catch (error) {
      return {
        section: 'financial',
        success: false,
        data: {},
        error: error instanceof Error ? error.message : String(error),
        apiCalls: 0,
        processingTime: Date.now() - startTime,
      };
    }
  }

  /**
   * Generic extractor for one template-driven CIM section.
   *
   * Replaces five near-identical per-section methods that differed only in
   * the CIMReview key and the focus instruction.
   *
   * @param sectionName - Logical section name reported in results/logs.
   * @param resultKey - Key in CIMReview where the section's data lives; also
   *                    used as the focus-field list for the LLM call.
   * @param text - Full document text.
   * @param instruction - Section-specific extraction instruction.
   */
  private async extractTemplateSection(
    sectionName: string,
    resultKey: keyof CIMReview,
    text: string,
    instruction: string
  ): Promise<SectionExtractionResult> {
    const startTime = Date.now();
    try {
      const result = await llmService.processCIMDocument(
        text,
        'BPCP CIM Review Template',
        undefined, // No existing analysis
        [resultKey as string], // Focus only on this section's fields
        instruction
      );
      const processingTime = Date.now() - startTime;
      const payload = result.jsonOutput as Partial<CIMReview> | undefined;
      const sectionData = result.success ? payload?.[resultKey] : undefined;
      if (sectionData) {
        return {
          section: sectionName,
          success: true,
          data: { [resultKey]: sectionData } as Partial<CIMReview>,
          apiCalls: 1,
          processingTime,
        };
      }
      return {
        section: sectionName,
        success: false,
        data: {},
        error: result.error,
        apiCalls: 1,
        processingTime,
      };
    } catch (error) {
      return {
        section: sectionName,
        success: false,
        data: {},
        error: error instanceof Error ? error.message : String(error),
        apiCalls: 0,
        processingTime: Date.now() - startTime,
      };
    }
  }

  /**
   * Merge successful section results over the default review skeleton.
   * Later sections overwrite earlier ones on key collisions (top-level keys
   * are distinct per section, so in practice there are no collisions).
   */
  private mergeSectionResults(results: SectionExtractionResult[]): Partial<CIMReview> {
    const merged: Partial<CIMReview> = { ...defaultCIMReview };
    results.forEach(result => {
      if (result.success) {
        Object.assign(merged, result.data);
      }
    });
    return merged;
  }

  /**
   * Build a short pipe-delimited summary line from the merged analysis data.
   */
  private generateSummary(data: Partial<CIMReview>): string {
    const parts: string[] = [];
    if (data.dealOverview?.targetCompanyName) {
      parts.push(`Target: ${data.dealOverview.targetCompanyName}`);
    }
    if (data.dealOverview?.industrySector) {
      parts.push(`Industry: ${data.dealOverview.industrySector}`);
    }
    if (data.financialSummary?.financials?.ltm?.revenue) {
      parts.push(`LTM Revenue: ${data.financialSummary.financials.ltm.revenue}`);
    }
    if (data.financialSummary?.financials?.ltm?.ebitda) {
      parts.push(`LTM EBITDA: ${data.financialSummary.financials.ltm.ebitda}`);
    }
    return parts.join(' | ') || 'CIM analysis completed';
  }
}
export const parallelDocumentProcessor = new ParallelDocumentProcessor();

View File

@@ -0,0 +1,80 @@
import { logger } from '../../utils/logger';
import type { ProcessingChunk } from './types';
// Number of chunks handled per batch during post-processing.
const BATCH_SIZE = 10;
/**
 * Derive lightweight, heuristic metadata for a single chunk.
 *
 * Every signal is computed from the chunk text alone: size counters plus
 * keyword-based flags for financial and technical content, and a timestamp
 * recording when the enrichment ran.
 */
export function enrichChunkMetadata(chunk: ProcessingChunk): Record<string, any> {
  const text = chunk.content;
  return {
    chunkSize: text.length,
    wordCount: text.split(/\s+/).length,
    sentenceCount: (text.match(/[.!?]+/g) ?? []).length,
    hasNumbers: /\d/.test(text),
    hasFinancialData: /revenue|ebitda|profit|margin|growth|valuation/i.test(text),
    hasTechnicalData: /technology|software|platform|api|database/i.test(text),
    processingTimestamp: new Date().toISOString()
  };
}
/**
 * Post-process chunks in fixed-size batches to keep memory bounded.
 *
 * Each batch runs its chunks concurrently; a chunk that throws during
 * enrichment is logged and dropped rather than failing the whole run.
 * Memory usage is logged after every batch, and an explicit GC is requested
 * when node is started with --expose-gc.
 */
export async function processChunksInBatches(
  chunks: ProcessingChunk[],
  documentId: string,
  options: {
    enableMetadataEnrichment?: boolean;
    similarityThreshold?: number;
  }
): Promise<ProcessingChunk[]> {
  const processed: ProcessingChunk[] = [];
  const totalBatches = Math.ceil(chunks.length / BATCH_SIZE);
  for (let offset = 0; offset < chunks.length; offset += BATCH_SIZE) {
    const batch = chunks.slice(offset, offset + BATCH_SIZE);
    const batchNumber = Math.floor(offset / BATCH_SIZE) + 1;
    logger.info(`Processing batch ${batchNumber}/${totalBatches} for document: ${documentId}`);
    // NOTE(review): this delay is labelled as API rate limiting, but no API
    // calls happen in this loop (enrichment is local) — confirm it is needed.
    const settled = await Promise.all(batch.map(async (chunk, idx) => {
      try {
        if (idx > 0) {
          await new Promise(resolve => setTimeout(resolve, 100));
        }
        if (options.enableMetadataEnrichment) {
          chunk.metadata = {
            ...chunk.metadata,
            ...enrichChunkMetadata(chunk)
          };
        }
        return chunk;
      } catch (error) {
        logger.error(`Failed to process chunk ${chunk.chunkIndex}`, error);
        return null;
      }
    }));
    for (const item of settled) {
      if (item !== null) {
        processed.push(item);
      }
    }
    // Request garbage collection between batches when available.
    if (global.gc) {
      global.gc();
    }
    const memoryUsage = process.memoryUsage();
    logger.info(`Batch completed. Memory usage: ${Math.round(memoryUsage.heapUsed / 1024 / 1024)}MB`);
  }
  return processed;
}

View File

@@ -0,0 +1,191 @@
import { logger } from '../../utils/logger';
import type { StructuredTable } from '../documentAiProcessor';
import type { ProcessingChunk } from './types';
import { isFinancialTable, formatTableAsMarkdown } from './tableProcessor';
import { detectSectionType, extractMetadata } from './utils';
// Maximum characters per chunk before a paragraph is split further.
const MAX_CHUNK_SIZE = 4000;
// Characters of overlap between consecutive fixed-size chunks (non-semantic mode).
const OVERLAP_SIZE = 200;
/**
 * Intermediate chunk produced by the semantic splitters before being
 * converted into a ProcessingChunk.
 */
interface SemanticChunk {
  content: string;
  // Approximate character offset into the source text (separator widths are
  // estimated by the splitters, so positions are not exact).
  startPosition: number;
  endPosition: number;
  sectionType?: string;
  metadata?: Record<string, any>;
}
/**
 * Create intelligent chunks with semantic boundaries.
 *
 * Structured tables (from Document AI) become one chunk each, formatted as
 * markdown and pushed first; the document text is then split either
 * semantically (paragraph/sentence based) or into fixed-size overlapping
 * windows. Chunk ids follow "<documentId>-table-N" / "<documentId>-chunk-N".
 *
 * @param text - Full document text to chunk.
 * @param documentId - Prefix for stable chunk ids.
 * @param enableSemanticChunking - Paragraph-based splitting when true;
 *        fixed-size windows with OVERLAP_SIZE overlap when false.
 * @param structuredTables - Tables extracted upstream; chunked first.
 */
export async function createIntelligentChunks(
  text: string,
  documentId: string,
  enableSemanticChunking: boolean = true,
  structuredTables: StructuredTable[] = []
): Promise<ProcessingChunk[]> {
  const chunks: ProcessingChunk[] = [];
  if (structuredTables.length > 0) {
    logger.info('Processing structured tables for chunking', {
      documentId,
      tableCount: structuredTables.length
    });
    structuredTables.forEach((table, index) => {
      const isFinancial = isFinancialTable(table);
      const markdownTable = formatTableAsMarkdown(table);
      const chunkIndex = chunks.length;
      chunks.push({
        id: `${documentId}-table-${index}`,
        content: markdownTable,
        chunkIndex,
        // Table chunks have no position in the linear text stream.
        startPosition: -1,
        endPosition: -1,
        sectionType: isFinancial ? 'financial-table' : 'table',
        metadata: {
          isStructuredTable: true,
          isFinancialTable: isFinancial,
          tableIndex: index,
          pageNumber: table.position?.pageNumber ?? -1,
          headerCount: table.headers.length,
          rowCount: table.rows.length,
          // Full table object retained for downstream consumers.
          structuredData: table
        }
      });
      logger.info('Created chunk for structured table', {
        documentId,
        tableIndex: index,
        isFinancial,
        chunkId: `${documentId}-table-${index}`,
        headerCount: table.headers.length,
        rowCount: table.rows.length
      });
    });
  }
  if (enableSemanticChunking) {
    // Paragraph/sentence based splitting; fragments of <= 50 chars are dropped.
    const semanticChunks = splitBySemanticBoundaries(text);
    for (let i = 0; i < semanticChunks.length; i++) {
      const chunk = semanticChunks[i];
      if (chunk && chunk.content.length > 50) {
        const chunkIndex = chunks.length;
        chunks.push({
          id: `${documentId}-chunk-${chunkIndex}`,
          content: chunk.content,
          chunkIndex,
          startPosition: chunk.startPosition,
          endPosition: chunk.endPosition,
          sectionType: chunk.sectionType || 'general',
          metadata: {
            ...(chunk.metadata || {}),
            hasStructuredTableContext: false
          }
        });
      }
    }
  } else {
    // Fixed-size sliding window with OVERLAP_SIZE characters of overlap.
    for (let i = 0; i < text.length; i += MAX_CHUNK_SIZE - OVERLAP_SIZE) {
      const chunkContent = text.substring(i, i + MAX_CHUNK_SIZE);
      if (chunkContent.trim().length > 50) {
        const chunkIndex = chunks.length;
        chunks.push({
          id: `${documentId}-chunk-${chunkIndex}`,
          content: chunkContent,
          chunkIndex,
          startPosition: i,
          endPosition: i + chunkContent.length,
          sectionType: detectSectionType(chunkContent),
          metadata: extractMetadata(chunkContent)
        });
      }
    }
  }
  return chunks;
}
/**
 * Split text into paragraph-level semantic chunks.
 *
 * Paragraphs are delimited by blank lines; a paragraph larger than
 * MAX_CHUNK_SIZE is broken down further by splitLargeParagraph().
 *
 * NOTE(review): position tracking assumes each separator is exactly two
 * characters ("\n\n"), but the split regex /\n\s*\n/ can consume more, so
 * start/end positions are approximate — confirm consumers tolerate this.
 */
function splitBySemanticBoundaries(text: string): SemanticChunk[] {
  const result: SemanticChunk[] = [];
  let cursor = 0;
  for (const para of text.split(/\n\s*\n/)) {
    const advance = para.length + 2; // +2 approximates the "\n\n" separator
    if (para.trim().length === 0) {
      cursor += advance;
      continue;
    }
    if (para.length > MAX_CHUNK_SIZE) {
      // Paragraph exceeds the chunk budget — split it into sentence groups.
      result.push(...splitLargeParagraph(para, cursor));
    } else {
      result.push({
        content: para.trim(),
        startPosition: cursor,
        endPosition: cursor + para.length,
        sectionType: detectSectionType(para),
        metadata: extractMetadata(para)
      });
    }
    cursor += advance;
  }
  return result;
}
/**
 * Split an oversized paragraph into sentence-grouped chunks of at most
 * MAX_CHUNK_SIZE characters.
 *
 * Fixes two defects in the previous implementation:
 * 1. Position tracking advanced by the *new* sentence's length because
 *    `currentChunk` was reassigned before the offset was updated, so every
 *    chunk after the first carried a wrong startPosition.
 * 2. `match(/[^.!?]+[.!?]+/g)` silently dropped any trailing text that has
 *    no sentence terminator; splitting with a lookaround keeps all content.
 *
 * @param paragraph - Paragraph text longer than MAX_CHUNK_SIZE.
 * @param startPosition - Offset of the paragraph in the source text.
 */
function splitLargeParagraph(
  paragraph: string,
  startPosition: number
): SemanticChunk[] {
  const chunks: SemanticChunk[] = [];
  // Split after each run of sentence terminators while keeping every
  // character (concatenating the pieces reproduces the paragraph exactly).
  const sentences = paragraph.split(/(?<=[.!?])(?=[^.!?])/);
  let currentChunk = '';
  let chunkStart = startPosition;
  for (const sentence of sentences) {
    if ((currentChunk + sentence).length > MAX_CHUNK_SIZE && currentChunk.length > 0) {
      // Flush the current chunk and start a new one with this sentence.
      chunks.push({
        content: currentChunk.trim(),
        startPosition: chunkStart,
        endPosition: chunkStart + currentChunk.length,
        sectionType: detectSectionType(currentChunk),
        metadata: extractMetadata(currentChunk)
      });
      // Advance by the *stored* chunk's length before reassigning.
      chunkStart += currentChunk.length;
      currentChunk = sentence;
    } else {
      currentChunk += sentence;
    }
  }
  // Add the final chunk, if any content remains.
  if (currentChunk.trim().length > 0) {
    chunks.push({
      content: currentChunk.trim(),
      startPosition: chunkStart,
      endPosition: chunkStart + currentChunk.length,
      sectionType: detectSectionType(currentChunk),
      metadata: extractMetadata(currentChunk)
    });
  }
  return chunks;
}

View File

@@ -0,0 +1,96 @@
import { logger } from '../../utils/logger';
import { vectorDatabaseService } from '../vectorDatabaseService';
import { VectorDatabaseModel } from '../../models/VectorDatabaseModel';
import type { ProcessingChunk } from './types';
const MAX_CONCURRENT_EMBEDDINGS = 5;
const STORE_BATCH_SIZE = 20;
// Matches the "-chunk-" and "-table-" id suffixes produced by the chunking
// module, so the owning document id can be recovered from any chunk id.
const CHUNK_ID_SEPARATOR = /-(?:chunk|table)-/;
/**
 * Generate embeddings with rate limiting and error handling.
 *
 * Processes at most MAX_CONCURRENT_EMBEDDINGS chunks at a time with a small
 * stagger between calls inside a batch. Chunks whose embedding fails are
 * logged and dropped rather than failing the whole run.
 *
 * @returns The chunks that got embeddings (annotated with their documentId)
 *          and the number of successful embedding API calls made.
 */
export async function generateEmbeddingsWithRateLimit(
  chunks: ProcessingChunk[]
): Promise<{ chunks: Array<ProcessingChunk & { embedding: number[]; documentId: string }>; apiCalls: number }> {
  const chunksWithEmbeddings: Array<ProcessingChunk & { embedding: number[]; documentId: string }> = [];
  let totalApiCalls = 0;
  // Process with concurrency control.
  for (let i = 0; i < chunks.length; i += MAX_CONCURRENT_EMBEDDINGS) {
    const batch = chunks.slice(i, i + MAX_CONCURRENT_EMBEDDINGS);
    const batchPromises = batch.map(async (chunk, batchIndex) => {
      try {
        // Stagger API calls inside the batch.
        if (batchIndex > 0) {
          await new Promise(resolve => setTimeout(resolve, 200));
        }
        const embedding = await vectorDatabaseService.generateEmbeddings(chunk.content);
        return {
          ...chunk,
          // BUG FIX: table chunks have "<docId>-table-N" ids; the previous
          // split on the literal '-chunk-' left the full id as documentId.
          documentId: chunk.id.split(CHUNK_ID_SEPARATOR)[0]
        };
      } catch (error) {
        logger.error(`Failed to generate embedding for chunk ${chunk.chunkIndex}`, error);
        // Return null for failed chunks; they are filtered out below.
        return null;
      }
    });
    const batchResults = await Promise.all(batchPromises);
    const successfulChunks = batchResults.filter(chunk => chunk !== null) as Array<ProcessingChunk & { embedding: number[]; documentId: string }>;
    chunksWithEmbeddings.push(...successfulChunks);
    // Each successful embedding generation is one API call.
    totalApiCalls += successfulChunks.length;
    logger.info(`Generated embeddings for ${chunksWithEmbeddings.length}/${chunks.length} chunks`);
  }
  return { chunks: chunksWithEmbeddings, apiCalls: totalApiCalls };
}
/**
 * Embed and persist chunks for a document using batched writes.
 *
 * Embeddings are generated first (with rate limiting); the embedded chunks
 * are then written to the vector store STORE_BATCH_SIZE at a time.
 *
 * @returns The number of embedding API calls made.
 * @throws Re-throws any storage failure after logging it.
 */
export async function storeChunksOptimized(
  chunks: ProcessingChunk[],
  documentId: string
): Promise<number> {
  try {
    // Generate embeddings in parallel with rate limiting.
    const { chunks: embedded, apiCalls } = await generateEmbeddingsWithRateLimit(chunks);
    const totalBatches = Math.ceil(embedded.length / STORE_BATCH_SIZE);
    for (let offset = 0; offset < embedded.length; offset += STORE_BATCH_SIZE) {
      const slice = embedded.slice(offset, offset + STORE_BATCH_SIZE);
      await VectorDatabaseModel.storeDocumentChunks(
        slice.map(chunk => ({
          documentId: chunk.documentId,
          content: chunk.content,
          metadata: chunk.metadata || {},
          embedding: chunk.embedding,
          chunkIndex: chunk.chunkIndex,
          section: chunk.sectionType || 'general',
          pageNumber: chunk.metadata?.['pageNumber']
        }))
      );
      logger.info(`Stored batch ${Math.floor(offset / STORE_BATCH_SIZE) + 1}/${totalBatches} for document: ${documentId}`);
    }
    logger.info(`Successfully stored ${embedded.length} chunks for document: ${documentId}`);
    return apiCalls;
  } catch (error) {
    logger.error(`Failed to store chunks for document: ${documentId}`, error);
    throw error;
  }
}

View File

@@ -0,0 +1,3 @@
// Public entry points for the optimized agentic RAG processing module.
export { OptimizedAgenticRAGProcessor, optimizedAgenticRAGProcessor } from './optimizedAgenticRAGProcessor';
// Shared types consumed by callers of the processor.
export type { ProcessingResult, ProcessingChunk, ProcessingOptions, ChunkingOptions } from './types';

View File

@@ -0,0 +1,129 @@
import { logger } from '../../utils/logger';
import type { ProcessingResult, ProcessingChunk, ProcessingOptions } from './types';
import { createIntelligentChunks } from './chunking';
import { processChunksInBatches } from './chunkProcessing';
import { storeChunksOptimized } from './embeddingService';
import { generateSummaryFromAnalysis } from './summaryGenerator';
import type { CIMReview } from '../llmSchemas';
import type { StructuredTable } from '../documentAiProcessor';
import type { ParsedFinancials } from '../financialTableParser';
// Import the LLM analysis methods from the original file for now
// TODO: Extract these to a separate llmAnalysis.ts module
import { OptimizedAgenticRAGProcessor as OriginalProcessor } from '../optimizedAgenticRAGProcessor';
export class OptimizedAgenticRAGProcessor {
private readonly originalProcessor: OriginalProcessor;
constructor() {
// Use the original processor for LLM analysis methods until they're fully extracted
this.originalProcessor = new OriginalProcessor();
}
/**
* Process large documents with optimized memory usage and proper chunking
*/
async processLargeDocument(
documentId: string,
text: string,
options: ProcessingOptions = {}
): Promise<ProcessingResult> {
const startTime = Date.now();
const initialMemory = process.memoryUsage().heapUsed;
try {
logger.info(`Starting optimized processing for document: ${documentId}`, {
textLength: text.length,
estimatedChunks: Math.ceil(text.length / 4000)
});
// Step 1: Create intelligent chunks with semantic boundaries
const {
enableSemanticChunking = true,
enableMetadataEnrichment,
similarityThreshold,
structuredTables = []
} = options;
const chunks = await createIntelligentChunks(
text,
documentId,
enableSemanticChunking,
structuredTables
);
// Step 2: Process chunks in batches to manage memory
const processedChunks = await processChunksInBatches(chunks, documentId, {
enableMetadataEnrichment,
similarityThreshold
});
// Step 3: Store chunks with optimized batching and track API calls
const embeddingApiCalls = await storeChunksOptimized(processedChunks, documentId);
// Step 4: Generate LLM analysis using MULTI-PASS extraction and track API calls
logger.info(`Starting MULTI-PASS LLM analysis for document: ${documentId}`);
const llmResult = await this.originalProcessor.generateLLMAnalysisMultiPass(
documentId,
text,
processedChunks
);
const processingTime = Date.now() - startTime;
const finalMemory = process.memoryUsage().heapUsed;
const memoryUsage = finalMemory - initialMemory;
// Sum all API calls: embeddings + LLM
const totalApiCalls = embeddingApiCalls + llmResult.apiCalls;
const result: ProcessingResult = {
totalChunks: chunks.length,
processedChunks: processedChunks.length,
processingTime,
averageChunkSize: Math.round(
processedChunks.reduce((sum: number, c: ProcessingChunk) => sum + c.content.length, 0) /
processedChunks.length
),
memoryUsage: Math.round(memoryUsage / 1024 / 1024), // MB
success: true,
summary: llmResult.summary,
analysisData: llmResult.analysisData,
apiCalls: totalApiCalls,
processingStrategy: 'document_ai_multi_pass_rag'
};
logger.info(`Optimized processing completed for document: ${documentId}`, result);
console.log('✅ Optimized agentic RAG processing completed successfully for document:', documentId);
console.log('✅ Total chunks processed:', result.processedChunks);
console.log('✅ Processing time:', result.processingTime, 'ms');
console.log('✅ Memory usage:', result.memoryUsage, 'MB');
console.log('✅ Summary length:', result.summary?.length || 0);
console.log('✅ Total API calls:', result.apiCalls);
return result;
} catch (error) {
logger.error(`Optimized processing failed for document: ${documentId}`, error);
console.log('❌ Optimized agentic RAG processing failed for document:', documentId);
console.log('❌ Error:', error instanceof Error ? error.message : String(error));
throw error;
}
}
/**
 * Run the multi-pass LLM extraction for a document.
 *
 * Thin delegation wrapper: the multi-pass implementation still lives on
 * the original processor and is reused here until it is fully extracted
 * into this class.
 *
 * @param documentId Document being analyzed.
 * @param text       Full extracted document text.
 * @param chunks     Processed chunks backing the RAG passes.
 * @returns Summary markdown, structured analysis data, and the number of
 *          API calls consumed by the passes.
 */
async generateLLMAnalysisMultiPass(
  documentId: string,
  text: string,
  chunks: ProcessingChunk[]
): Promise<{ summary: string; analysisData: CIMReview; apiCalls: number }> {
  const multiPassResult = await this.originalProcessor.generateLLMAnalysisMultiPass(
    documentId,
    text,
    chunks
  );
  return multiPassResult;
}
}
// Shared singleton instance used by the rest of the processing pipeline.
export const optimizedAgenticRAGProcessor = new OptimizedAgenticRAGProcessor();

View File

@@ -0,0 +1,51 @@
/**
 * Create a comprehensive query for CIM document analysis.
 *
 * The returned text describes everything the analysis is looking for in a
 * CIM and is designed to be embedded and compared against document chunks
 * for RAG-based retrieval: it packs in weighted topic areas plus dense
 * financial/market/investment vocabulary to maximize semantic overlap with
 * the most relevant sections.
 *
 * @returns A static, multi-section query string with priority weightings.
 */
export function createCIMAnalysisQuery(): string {
return `Confidential Information Memorandum (CIM) document comprehensive analysis with priority weighting:
**HIGH PRIORITY (Weight: 10/10)** - Critical for investment decision:
- Historical financial performance table with revenue, EBITDA, gross profit, margins, and growth rates for FY-3, FY-2, FY-1, and LTM periods
- Executive summary financial highlights and key metrics
- Investment thesis, key attractions, risks, and value creation opportunities
- Deal overview including target company name, industry sector, transaction type, geography, deal source
**HIGH PRIORITY (Weight: 9/10)** - Essential investment analysis:
- Market analysis including total addressable market (TAM), serviceable addressable market (SAM), market growth rates, CAGR
- Competitive landscape analysis with key competitors, market position, market share, competitive differentiation
- Business description including core operations, key products and services, unique value proposition, revenue mix
- Management team overview including key leaders, management quality assessment, post-transaction intentions
**MEDIUM PRIORITY (Weight: 7/10)** - Important context:
- Customer base overview including customer segments, customer concentration risk, top customers percentage, contract length, recurring revenue
- Industry trends, drivers, tailwinds, headwinds, regulatory environment
- Barriers to entry, competitive moats, basis of competition
- Quality of earnings analysis, EBITDA adjustments, addbacks, capital expenditures, working capital intensity, free cash flow quality
**MEDIUM PRIORITY (Weight: 6/10)** - Supporting information:
- Key supplier dependencies, supply chain risks, supplier concentration
- Organizational structure, reporting relationships, depth of team
- Revenue growth drivers, margin stability analysis, profitability trends
- Critical questions for management, missing information, preliminary recommendation, proposed next steps
**LOWER PRIORITY (Weight: 4/10)** - Additional context:
- Transaction details and deal structure
- CIM document dates, reviewers, page count, stated reason for sale, employee count
- Geographic locations and operating locations
- Market dynamics and macroeconomic factors
**SEMANTIC SPECIFICITY ENHANCEMENTS**:
Use specific financial terminology: "historical financial performance table", "income statement", "P&L statement", "financial summary table", "consolidated financials", "revenue growth year-over-year", "EBITDA margin percentage", "gross profit margin", "trailing twelve months LTM", "fiscal year FY-1 FY-2 FY-3"
Use specific market terminology: "total addressable market TAM", "serviceable addressable market SAM", "compound annual growth rate CAGR", "market share percentage", "competitive positioning", "barriers to entry", "competitive moat", "market leader", "niche player"
Use specific investment terminology: "investment thesis", "value creation levers", "margin expansion opportunities", "add-on acquisition potential", "operational improvements", "M&A strategy", "preliminary recommendation", "due diligence questions"
**CONTEXT ENRICHMENT**:
- Document structure hints: Look for section headers like "Financial Summary", "Market Analysis", "Competitive Landscape", "Management Team", "Investment Highlights"
- Table locations: Financial tables typically in "Financial Summary" or "Historical Financials" sections, may also be in appendices
- Appendix references: Check appendices for detailed financials, management bios, market research, competitive analysis
- Page number context: Note page numbers for key sections and tables for validation`;
}

View File

@@ -0,0 +1,118 @@
import { logger } from '../../utils/logger';
import { vectorDatabaseService } from '../vectorDatabaseService';
import type { ProcessingChunk } from './types';
/**
 * Select the most relevant chunks for a document using RAG vector search.
 *
 * Flow: embed the query, load the document's stored chunks, run a
 * similarity search, keep only hits from this document, top up with
 * keyword-matched "key section" chunks when fewer than 10 survive, then
 * greedily take chunks (highest similarity first) until the token budget
 * is filled. Selected chunks are returned in original document order.
 *
 * @param documentId       Document whose chunks are being selected.
 * @param queryText        Query text to embed and search against.
 * @param originalChunks   In-memory chunks; results are mapped back to
 *                         these by chunkIndex so their metadata is kept.
 * @param targetTokenCount Approximate token budget for the selection,
 *                         estimated at ~4 characters per token.
 * @returns `usedRAG: false` with an empty chunk list signals the caller
 *          to fall back to processing the full document.
 */
export async function findRelevantChunks(
  documentId: string,
  queryText: string,
  originalChunks: ProcessingChunk[],
  targetTokenCount: number = 15000
): Promise<{ chunks: ProcessingChunk[]; usedRAG: boolean }> {
  try {
    logger.info('Starting RAG-based chunk selection', {
      documentId,
      totalChunks: originalChunks.length,
      targetTokenCount,
      queryPreview: queryText.substring(0, 200)
    });
    // Generate embedding for the query
    const queryEmbedding = await vectorDatabaseService.generateEmbeddings(queryText);
    // Get all chunks for this document
    const allChunks = await vectorDatabaseService.searchByDocumentId(documentId);
    if (allChunks.length === 0) {
      logger.warn('No chunks found for document, falling back to full document', { documentId });
      return { chunks: [], usedRAG: false };
    }
    // Calculate similarity for each chunk
    // We'll use a simplified approach: search for similar chunks and filter by documentId
    // NOTE(review): the limit below is applied BEFORE the documentId filter,
    // so if the index holds other documents, fewer than `limit` hits from
    // this document may survive — confirm searchSimilar scoping.
    const similarChunks = await vectorDatabaseService.searchSimilar(
      queryEmbedding,
      Math.min(allChunks.length, 30), // Increased from 20 to 30 to get more chunks
      0.4 // Lower threshold from 0.5 to 0.4 to get more chunks
    );
    // Filter to only chunks from this document and sort by similarity
    const relevantChunks = similarChunks
      .filter(chunk => chunk.documentId === documentId)
      .sort((a, b) => b.similarity - a.similarity);
    logger.info('Found relevant chunks via RAG search', {
      documentId,
      totalChunks: allChunks.length,
      relevantChunks: relevantChunks.length,
      avgSimilarity: relevantChunks.length > 0
        ? relevantChunks.reduce((sum, c) => sum + c.similarity, 0) / relevantChunks.length
        : 0
    });
    // If we didn't get enough chunks, supplement with chunks from key sections
    if (relevantChunks.length < 10) {
      logger.info('Supplementing with section-based chunks', {
        documentId,
        currentChunks: relevantChunks.length
      });
      // Get chunks from important sections (executive summary, financials, etc.)
      const sectionKeywords = ['executive', 'summary', 'financial', 'revenue', 'ebitda', 'management', 'market', 'competitive'];
      const sectionChunks = allChunks.filter(chunk => {
        const contentLower = chunk.content.toLowerCase();
        return sectionKeywords.some(keyword => contentLower.includes(keyword));
      });
      // Add section chunks that aren't already included.
      // Supplemental chunks are appended AFTER the similarity-sorted hits,
      // so they are considered last by the token-budget loop below.
      const existingIndices = new Set(relevantChunks.map(c => c.chunkIndex));
      const additionalChunks = sectionChunks
        .filter(c => !existingIndices.has(c.chunkIndex))
        .slice(0, 10 - relevantChunks.length);
      relevantChunks.push(...additionalChunks);
    }
    // Estimate tokens and select chunks until we reach target
    const selectedChunks: ProcessingChunk[] = [];
    let currentTokenCount = 0;
    const avgTokensPerChar = 0.25; // Rough estimate: 4 chars per token
    for (const chunk of relevantChunks) {
      const chunkTokens = chunk.content.length * avgTokensPerChar;
      if (currentTokenCount + chunkTokens <= targetTokenCount) {
        // Find the original ProcessingChunk to preserve metadata
        const originalChunk = originalChunks.find(c => c.chunkIndex === chunk.chunkIndex);
        if (originalChunk) {
          selectedChunks.push(originalChunk);
          currentTokenCount += chunkTokens;
        }
      } else {
        // First chunk that would exceed the budget STOPS selection entirely
        // (greedy prefix) — later, smaller chunks are not considered.
        break;
      }
    }
    // Sort selected chunks by chunkIndex to maintain document order
    selectedChunks.sort((a, b) => a.chunkIndex - b.chunkIndex);
    logger.info('RAG-based chunk selection completed', {
      documentId,
      selectedChunks: selectedChunks.length,
      estimatedTokens: currentTokenCount,
      targetTokens: targetTokenCount,
      reductionRatio: `${((1 - selectedChunks.length / originalChunks.length) * 100).toFixed(1)}%`
    });
    return { chunks: selectedChunks, usedRAG: true };
  } catch (error) {
    // Any failure (embedding, search, etc.) degrades gracefully to the
    // full-document path rather than failing the processing run.
    logger.error('RAG-based chunk selection failed, falling back to full document', {
      documentId,
      error: error instanceof Error ? error.message : String(error)
    });
    return { chunks: [], usedRAG: false };
  }
}

View File

@@ -0,0 +1,273 @@
import type { CIMReview } from '../llmSchemas';
/**
 * Render a CIMReview analysis object as a markdown/HTML summary document.
 *
 * Sections are emitted only when their anchor field is present (e.g. the
 * Deal Overview section requires `targetCompanyName`), and individual
 * "**Label:** value" lines are emitted only for non-empty fields. The
 * financial summary is rendered as an HTML table whose columns are the
 * periods (FY3 → FY2 → FY1 → LTM, oldest first) containing at least one
 * metric, and whose rows are the metrics present in any period; values of
 * "Not specified in CIM" (or blank) render as "-".
 *
 * Refactor note: the original implementation repeated the same
 * "if (value) summary += `**Label:** value`" stanza dozens of times and
 * copy-pasted the six table-row blocks; this version is data-driven but
 * produces byte-identical output.
 *
 * @param analysisData Structured CIM review data produced by the LLM passes.
 * @returns Markdown beginning with "# CIM Review Summary".
 */
export function generateSummaryFromAnalysis(analysisData: CIMReview): string {
  // Emit "**Label:** value" plus a trailing blank line, or nothing when the
  // value is empty/missing — the repeated pattern for every scalar field.
  const field = (label: string, value: unknown): string =>
    value ? `**${label}:** ${value}\n\n` : '';

  let summary = '# CIM Review Summary\n\n';

  // Deal overview (anchored on the target company name)
  const deal = analysisData.dealOverview;
  if (deal?.targetCompanyName) {
    summary += `## Deal Overview\n\n`;
    summary += field('Target Company', deal.targetCompanyName);
    summary += field('Industry', deal.industrySector);
    summary += field('Transaction Type', deal.transactionType);
    summary += field('Geography', deal.geography);
    summary += field('Employee Count', deal.employeeCount);
    summary += field('Deal Source', deal.dealSource);
    summary += field('Reason for Sale', deal.statedReasonForSale);
  }

  // Business description (anchored on the core operations summary)
  const business = analysisData.businessDescription;
  if (business?.coreOperationsSummary) {
    summary += `## Business Description\n\n`;
    summary += field('Core Operations', business.coreOperationsSummary);
    summary += field('Key Products/Services', business.keyProductsServices);
    summary += field('Unique Value Proposition', business.uniqueValueProposition);

    const customers = business.customerBaseOverview;
    if (customers) {
      summary += `### Customer Base Overview\n\n`;
      summary += field('Key Customer Segments', customers.keyCustomerSegments);
      summary += field('Customer Concentration Risk', customers.customerConcentrationRisk);
      summary += field('Typical Contract Length', customers.typicalContractLength);
    }
    summary += field('Supplier Dependence Risk', business.keySupplierOverview?.dependenceConcentrationRisk);
  }

  // Market & industry analysis (anchored on estimated market size)
  const market = analysisData.marketIndustryAnalysis;
  if (market?.estimatedMarketSize) {
    summary += `## Market & Industry Analysis\n\n`;
    summary += field('Market Size', market.estimatedMarketSize);
    summary += field('Market Growth Rate', market.estimatedMarketGrowthRate);
    summary += field('Industry Trends', market.keyIndustryTrends);
    summary += field('Barriers to Entry', market.barriersToEntry);

    const landscape = market.competitiveLandscape;
    if (landscape) {
      summary += `### Competitive Landscape\n\n`;
      summary += field('Key Competitors', landscape.keyCompetitors);
      summary += field('Market Position', landscape.targetMarketPosition);
      summary += field('Basis of Competition', landscape.basisOfCompetition);
    }
  }

  // Financial summary table + qualitative notes
  const finSummary = analysisData.financialSummary;
  if (finSummary?.financials) {
    summary += `## Financial Summary\n\n`;
    const financials = finSummary.financials;

    // Columns in chronological order (oldest to newest): FY3 → FY2 → FY1 → LTM
    const periodOrder = [
      { key: 'fy3', label: 'FY3' },
      { key: 'fy2', label: 'FY2' },
      { key: 'fy1', label: 'FY1' },
      { key: 'ltm', label: 'LTM' },
    ] as const;
    // Rows, in the order they appear in the rendered table
    const metricRows = [
      { label: 'Revenue', metric: 'revenue' },
      { label: 'Gross Profit', metric: 'grossProfit' },
      { label: 'Gross Margin', metric: 'grossMargin' },
      { label: 'EBITDA', metric: 'ebitda' },
      { label: 'EBITDA Margin', metric: 'ebitdaMargin' },
      { label: 'Revenue Growth', metric: 'revenueGrowth' },
    ] as const;
    type PeriodKey = (typeof periodOrder)[number]['key'];
    type MetricKey = (typeof metricRows)[number]['metric'];
    const allMetrics = metricRows.map(row => row.metric);

    // A period qualifies as a column when it has at least one metric value.
    const periods = periodOrder.filter(({ key }) => {
      const periodData = financials[key];
      return !!periodData && allMetrics.some(metric => periodData[metric]);
    });

    // Only create the table if at least one period has data
    if (periods.length > 0) {
      // Cell value, filtering placeholder/blank strings down to "-".
      const getValue = (periodKey: PeriodKey, metric: MetricKey): string => {
        const periodData = financials[periodKey];
        if (!periodData) return '-';
        const value = periodData[metric];
        return value && value.trim() && value !== 'Not specified in CIM' ? value : '-';
      };

      summary += `<table class="financial-table">\n`;
      summary += `<thead>\n<tr>\n<th>Metric</th>\n`;
      periods.forEach(period => {
        summary += `<th>${period.label}</th>\n`;
      });
      summary += `</tr>\n</thead>\n<tbody>\n`;

      // A metric row appears when ANY period holds a value for it.
      for (const { label, metric } of metricRows) {
        const present = periodOrder.some(({ key }) => financials[key]?.[metric]);
        if (!present) continue;
        summary += `<tr>\n<td><strong>${label}</strong></td>\n`;
        periods.forEach(period => {
          summary += `<td>${getValue(period.key, metric)}</td>\n`;
        });
        summary += `</tr>\n`;
      }
      summary += `</tbody>\n</table>\n\n`;
    }

    // Qualitative financial notes
    summary += field('Quality of Earnings', finSummary.qualityOfEarnings);
    summary += field('Revenue Growth Drivers', finSummary.revenueGrowthDrivers);
    summary += field('Margin Stability', finSummary.marginStabilityAnalysis);
    summary += field('Capital Expenditures', finSummary.capitalExpenditures);
    summary += field('Working Capital Intensity', finSummary.workingCapitalIntensity);
    summary += field('Free Cash Flow Quality', finSummary.freeCashFlowQuality);
  }

  // Management team (anchored on key leaders)
  const management = analysisData.managementTeamOverview;
  if (management?.keyLeaders) {
    summary += `## Management Team\n\n`;
    summary += field('Key Leaders', management.keyLeaders);
    summary += field('Quality Assessment', management.managementQualityAssessment);
    summary += field('Post-Transaction Intentions', management.postTransactionIntentions);
    summary += field('Organizational Structure', management.organizationalStructure);
  }

  // Investment thesis (anchored on key attractions)
  const thesis = analysisData.preliminaryInvestmentThesis;
  if (thesis?.keyAttractions) {
    summary += `## Investment Thesis\n\n`;
    summary += field('Key Attractions', thesis.keyAttractions);
    summary += field('Potential Risks', thesis.potentialRisks);
    summary += field('Value Creation Levers', thesis.valueCreationLevers);
    summary += field('Alignment with Fund Strategy', thesis.alignmentWithFundStrategy);
  }

  // Key questions & next steps (anchored on critical questions)
  const nextSteps = analysisData.keyQuestionsNextSteps;
  if (nextSteps?.criticalQuestions) {
    summary += `## Key Questions & Next Steps\n\n`;
    summary += field('Critical Questions', nextSteps.criticalQuestions);
    summary += field('Missing Information', nextSteps.missingInformation);
    summary += field('Preliminary Recommendation', nextSteps.preliminaryRecommendation);
    summary += field('Rationale for Recommendation', nextSteps.rationaleForRecommendation);
    summary += field('Proposed Next Steps', nextSteps.proposedNextSteps);
  }

  return summary;
}

View File

@@ -0,0 +1,69 @@
import { logger } from '../../utils/logger';
import type { StructuredTable } from '../documentAiProcessor';
import type { ProcessingChunk } from './types';
/**
 * Heuristically decide whether a structured table contains financial data.
 *
 * A table counts as financial when its header row mentions a reporting
 * period (FY/LTM/TTM/YTD/CY/quarter/year) AND its body either names a
 * common financial metric or contains currency/percentage values.
 * Positive matches are logged for traceability.
 */
export function isFinancialTable(table: StructuredTable): boolean {
  const headerText = table.headers.join(' ').toLowerCase();
  const bodyText = table.rows.map(row => row.join(' ').toLowerCase()).join(' ');

  const periodPattern = /fy[-\s]?\d{1,2}|20\d{2}|ltm|ttm|ytd|cy\d{2}|q[1-4]/i;
  const metricNames = [
    'revenue', 'sales', 'ebitda', 'ebit', 'profit', 'margin',
    'gross profit', 'operating income', 'net income', 'cash flow',
    'earnings', 'assets', 'liabilities', 'equity'
  ];
  const currencyOrPercentPattern = /\$[\d,]+(?:\.\d+)?[kmb]?|\d+(?:\.\d+)?%/;

  const mentionsPeriod = periodPattern.test(headerText);
  const mentionsMetric = metricNames.some(metric => bodyText.includes(metric));
  const hasNumericValues = currencyOrPercentPattern.test(bodyText);

  const looksFinancial = mentionsPeriod && (mentionsMetric || hasNumericValues);
  if (looksFinancial) {
    logger.info('Identified financial structured table', {
      pageNumber: table.position?.pageNumber ?? -1,
      headerPreview: table.headers.slice(0, 5),
      rowCount: table.rows.length
    });
  }
  return looksFinancial;
}
/**
 * Render a structured table as a GitHub-style markdown table so the LLM
 * sees rows and columns aligned the way they appeared in the document.
 * Tables without headers are emitted as body rows only (no separator).
 */
export function formatTableAsMarkdown(table: StructuredTable): string {
  const toRow = (cells: string[]): string => `| ${cells.join(' | ')} |`;

  const lines: string[] = [];
  if (table.headers.length > 0) {
    lines.push(toRow(table.headers));
    lines.push(toRow(table.headers.map(() => '---')));
  }
  table.rows.forEach(row => lines.push(toRow(row)));
  return lines.join('\n');
}
/**
 * Drop chunks flagged as structured tables, leaving only narrative text.
 * Used for qualitative extraction passes where table rows would add noise.
 * Logs only when at least one chunk was actually removed.
 */
export function excludeStructuredTableChunks(chunks: ProcessingChunk[]): ProcessingChunk[] {
  const narrativeChunks = chunks.filter(chunk => chunk.metadata?.isStructuredTable !== true);
  const removedCount = chunks.length - narrativeChunks.length;
  if (removedCount > 0) {
    logger.info('Structured table chunks excluded for narrative pass', {
      originalCount: chunks.length,
      filteredCount: narrativeChunks.length
    });
  }
  return narrativeChunks;
}

View File

@@ -0,0 +1,41 @@
import type { CIMReview } from '../llmSchemas';
import type { StructuredTable } from '../documentAiProcessor';
/** A chunk of document text flowing through the processing pipeline. */
export interface ProcessingChunk {
  /** Unique identifier for the chunk. */
  id: string;
  /** Raw text content of the chunk. */
  content: string;
  /** Position of the chunk within the document's chunk sequence. */
  chunkIndex: number;
  /** Chunk start offset in the extracted text (presumably characters — confirm). */
  startPosition: number;
  /** Chunk end offset in the extracted text (presumably characters — confirm). */
  endPosition: number;
  /** Detected section category (e.g. 'financial', 'market', 'general'). */
  sectionType?: string;
  /** Free-form enrichment data (e.g. isStructuredTable, financial-term hits). */
  metadata?: Record<string, any>;
}
/** Outcome and statistics of a full document processing run. */
export interface ProcessingResult {
  /** Number of chunks produced from the document. */
  totalChunks: number;
  /** Number of chunks actually processed/stored. */
  processedChunks: number;
  /** Wall-clock processing time in milliseconds. */
  processingTime: number;
  /** Mean chunk length in characters. */
  averageChunkSize: number;
  /** Approximate heap growth during processing, in MB. */
  memoryUsage: number;
  /** Generated markdown summary, when analysis succeeded. */
  summary?: string;
  /** Structured CIM review extracted by the LLM passes. */
  analysisData?: CIMReview;
  success: boolean;
  error?: string;
  /** Total upstream API calls made (embeddings + LLM). */
  apiCalls: number;
  processingStrategy: 'document_ai_agentic_rag' | 'document_ai_multi_pass_rag';
}
/** Tuning options for the chunking stage. */
export interface ChunkingOptions {
  enableSemanticChunking?: boolean;
  enableMetadataEnrichment?: boolean;
  similarityThreshold?: number;
  structuredTables?: StructuredTable[];
}
// NOTE(review): ProcessingOptions currently duplicates ChunkingOptions
// field-for-field; if they are meant to stay in sync, consider
// `export interface ProcessingOptions extends ChunkingOptions {}`.
/** Options accepted by the top-level document processing entry points. */
export interface ProcessingOptions {
  enableSemanticChunking?: boolean;
  enableMetadataEnrichment?: boolean;
  similarityThreshold?: number;
  structuredTables?: StructuredTable[];
}

View File

@@ -0,0 +1,137 @@
import { logger } from '../../utils/logger';
import type { ProcessingChunk } from './types';
/**
 * Cosine similarity between two equal-length embedding vectors.
 *
 * Returns 0 (rather than NaN or throwing) for mismatched lengths or when
 * either vector has zero magnitude.
 */
export function calculateCosineSimilarity(embedding1: number[], embedding2: number[]): number {
  if (embedding1.length !== embedding2.length) {
    return 0;
  }
  let dot = 0;
  let normSq1 = 0;
  let normSq2 = 0;
  embedding1.forEach((value, i) => {
    const other = embedding2[i];
    dot += value * other;
    normSq1 += value * value;
    normSq2 += other * other;
  });
  const denominator = Math.sqrt(normSq1) * Math.sqrt(normSq2);
  return denominator === 0 ? 0 : dot / denominator;
}
/**
 * Classify a chunk of text into a coarse CIM section category via keyword
 * matching (case-insensitive). Categories are checked in priority order
 * and the first match wins; unmatched content falls through to 'general'.
 */
export function detectSectionType(content: string): string {
  const haystack = content.toLowerCase();
  // Priority-ordered: earlier categories win when keywords overlap.
  const sectionRules: Array<[string, string[]]> = [
    ['financial', ['financial', 'revenue', 'ebitda']],
    ['market', ['market', 'industry', 'competitive']],
    ['business', ['business', 'operation', 'product']],
    ['management', ['management', 'team', 'leadership']],
    ['technology', ['technology', 'software', 'platform']],
    ['risk_opportunity', ['risk', 'challenge', 'opportunity']],
  ];
  for (const [sectionType, keywords] of sectionRules) {
    if (keywords.some(keyword => haystack.includes(keyword))) {
      return sectionType;
    }
  }
  return 'general';
}
/**
 * Derive lightweight metadata from chunk content for enrichment:
 * - `revenueMentions`: count of currency amounts like "$12.5 million" (only
 *   set when at least one match is found);
 * - `companies`: capitalized names ending in a legal suffix (Inc/Corp/…),
 *   only set when found;
 * - `financialTerms`: which of a fixed list of financial terms appear
 *   (always set, possibly empty).
 */
export function extractMetadata(content: string): Record<string, any> {
  const metadata: Record<string, any> = {};
  const lowerContent = content.toLowerCase();

  const currencyMentions = content.match(/\$[\d,]+(?:\.\d+)?\s*(?:million|billion|M|B)/gi);
  if (currencyMentions) {
    metadata['revenueMentions'] = currencyMentions.length;
  }

  const companyNames = content.match(/\b[A-Z][a-z]+(?:\s+[A-Z][a-z]+)*\s+(?:Inc|Corp|LLC|Ltd|Company|Group)\b/g);
  if (companyNames) {
    metadata['companies'] = companyNames;
  }

  metadata['financialTerms'] = ['revenue', 'ebitda', 'profit', 'margin', 'growth', 'valuation']
    .filter(term => lowerContent.includes(term));

  return metadata;
}
/**
 * Recursively merge `source` into `target`, preferring values that carry
 * real information. Mutates `target` in place.
 *
 * Rules, per key:
 * - null/undefined source values are ignored;
 * - a source string containing "Not specified" never replaces an existing
 *   informative target string;
 * - nested plain objects are merged recursively (arrays are leaf values);
 * - a leaf value only overwrites the target when the target is empty,
 *   missing, or itself a "Not specified" placeholder.
 */
export function deepMerge(target: any, source: any): void {
  const isPlaceholder = (value: unknown): boolean =>
    typeof value === 'string' && value.includes('Not specified');

  for (const key in source) {
    const incoming = source[key];
    if (incoming === null || incoming === undefined) {
      continue;
    }
    const existing = target[key];

    // Never let a placeholder clobber real string data we already have.
    if (isPlaceholder(incoming) &&
        existing && typeof existing === 'string' && !isPlaceholder(existing)) {
      continue;
    }

    if (typeof incoming === 'object' && incoming !== null && !Array.isArray(incoming)) {
      if (!target[key] || typeof target[key] !== 'object') {
        target[key] = {};
      }
      deepMerge(target[key], incoming);
    } else if (!existing || isPlaceholder(existing) || existing === '') {
      target[key] = incoming;
    }
  }
}
/**
 * Read a nested value using a dot-separated path (e.g. "a.b.c").
 * Returns undefined as soon as any intermediate segment is missing.
 */
export function getNestedField(obj: any, path: string): any {
  let current = obj;
  for (const segment of path.split('.')) {
    current = current?.[segment];
  }
  return current;
}
/**
 * Write a value at a dot-separated path (e.g. "a.b.c"), creating any
 * missing (or non-truthy) intermediate objects along the way.
 * Mutates `obj` in place.
 */
export function setNestedField(obj: any, path: string, value: any): void {
  const segments = path.split('.');
  let cursor = obj;
  for (let i = 0; i < segments.length - 1; i++) {
    const segment = segments[i];
    if (!cursor[segment]) {
      cursor[segment] = {};
    }
    cursor = cursor[segment];
  }
  cursor[segments[segments.length - 1]] = value;
}

View File

@@ -5,6 +5,7 @@ import { llmService } from './llmService';
import { CIMReview } from './llmSchemas';
import { cimReviewSchema } from './llmSchemas';
import { defaultCIMReview } from './unifiedDocumentProcessor';
import { financialExtractionMonitoringService } from './financialExtractionMonitoringService';
interface ProcessingResult {
success: boolean;
@@ -111,12 +112,14 @@ class SimpleDocumentProcessor {
});
let financialData: CIMReview['financialSummary'] | null = null;
const financialExtractionStartTime = Date.now();
try {
const financialResult = await llmService.processFinancialsOnly(
extractedText,
deterministicFinancials || undefined
);
apiCalls += 1;
const financialExtractionDuration = Date.now() - financialExtractionStartTime;
if (financialResult.success && financialResult.jsonOutput?.financialSummary) {
financialData = financialResult.jsonOutput.financialSummary;
@@ -124,13 +127,92 @@ class SimpleDocumentProcessor {
documentId,
hasFinancials: !!financialData.financials
});
// Track successful financial extraction event
const financials = financialData.financials;
const periodsExtracted: string[] = [];
const metricsExtractedSet = new Set<string>();
if (financials) {
['fy3', 'fy2', 'fy1', 'ltm'].forEach(period => {
const periodData = financials[period as keyof typeof financials];
if (periodData) {
// Check if period has any data
const hasData = periodData.revenue || periodData.ebitda || periodData.grossProfit;
if (hasData) {
periodsExtracted.push(period);
// Track which metrics are present
if (periodData.revenue) metricsExtractedSet.add('revenue');
if (periodData.revenueGrowth) metricsExtractedSet.add('revenueGrowth');
if (periodData.grossProfit) metricsExtractedSet.add('grossProfit');
if (periodData.grossMargin) metricsExtractedSet.add('grossMargin');
if (periodData.ebitda) metricsExtractedSet.add('ebitda');
if (periodData.ebitdaMargin) metricsExtractedSet.add('ebitdaMargin');
}
}
});
}
// Determine extraction method
const extractionMethod = deterministicFinancials
? 'deterministic_parser'
: (financialResult.model?.includes('haiku') ? 'llm_haiku' : 'llm_sonnet');
// Track extraction event (non-blocking)
financialExtractionMonitoringService.trackExtractionEvent({
documentId,
userId,
extractionMethod: extractionMethod as 'deterministic_parser' | 'llm_haiku' | 'llm_sonnet' | 'fallback',
modelUsed: financialResult.model,
success: true,
hasFinancials: !!financials,
periodsExtracted,
metricsExtracted: Array.from(metricsExtractedSet),
processingTimeMs: financialExtractionDuration,
apiCallDurationMs: financialExtractionDuration, // Approximate
tokensUsed: financialResult.inputTokens + financialResult.outputTokens,
costEstimateUsd: financialResult.cost,
}).catch(err => {
logger.debug('Failed to track financial extraction event (non-critical)', { error: err.message });
});
} else {
// Track failed financial extraction event
const extractionMethod = deterministicFinancials
? 'deterministic_parser'
: 'llm_haiku'; // Default assumption
financialExtractionMonitoringService.trackExtractionEvent({
documentId,
userId,
extractionMethod: extractionMethod as 'deterministic_parser' | 'llm_haiku' | 'llm_sonnet' | 'fallback',
success: false,
errorType: 'api_error',
errorMessage: financialResult.error,
processingTimeMs: Date.now() - financialExtractionStartTime,
}).catch(err => {
logger.debug('Failed to track financial extraction event (non-critical)', { error: err.message });
});
logger.warn('Financial extraction failed, will try in main extraction', {
documentId,
error: financialResult.error
});
}
} catch (financialError) {
// Track error event
financialExtractionMonitoringService.trackExtractionEvent({
documentId,
userId,
extractionMethod: deterministicFinancials ? 'deterministic_parser' : 'llm_haiku',
success: false,
errorType: 'api_error',
errorMessage: financialError instanceof Error ? financialError.message : String(financialError),
processingTimeMs: Date.now() - financialExtractionStartTime,
}).catch(err => {
logger.debug('Failed to track financial extraction event (non-critical)', { error: err.message });
});
logger.warn('Financial extraction threw error, will try in main extraction', {
documentId,
error: financialError instanceof Error ? financialError.message : String(financialError)

View File

@@ -0,0 +1,54 @@
/**
* Shared types for document-related operations
*/
/**
 * Document status types
 *
 * States a document can be in across upload and processing.
 */
export type DocumentStatus =
  | 'pending'
  | 'uploading'
  | 'processing'
  | 'completed'
  | 'failed'
  | 'cancelled';
/**
 * Document metadata
 *
 * Persistent record describing an uploaded document and its processing
 * lifecycle timestamps.
 */
export interface DocumentMetadata {
  id: string;
  /** Owner of the document. */
  userId: string;
  fileName: string;
  /** File size (presumably bytes — confirm at call sites). */
  fileSize: number;
  mimeType: string;
  status: DocumentStatus;
  createdAt: Date;
  updatedAt: Date;
  /** Set when processing begins. */
  processingStartedAt?: Date;
  /** Set when processing finishes. */
  processingCompletedAt?: Date;
  /** Most recent error message, if any. */
  error?: string;
}
/**
 * Document upload options
 *
 * Input required to register a new document upload.
 */
export interface DocumentUploadOptions {
  fileName: string;
  mimeType: string;
  /** File size (presumably bytes — confirm at call sites). */
  fileSize: number;
  userId: string;
}
/**
 * Document processing metadata
 *
 * Lightweight record of a single processing run for a document.
 */
export interface DocumentProcessingMetadata {
  documentId: string;
  userId: string;
  /** Processing strategy identifier (e.g. 'document_ai_multi_pass_rag'). */
  strategy: string;
  /** Wall-clock processing time, if recorded. */
  processingTime?: number;
  /** Number of upstream API calls made during processing, if recorded. */
  apiCalls?: number;
  /** Error message when the run failed. */
  error?: string;
}

60
backend/src/types/job.ts Normal file
View File

@@ -0,0 +1,60 @@
/**
 * Shared types for job processing
 * (background job queue entries, configuration, and run results).
 */

/**
 * Lifecycle status of a background job.
 */
export type JobStatus =
  | 'pending'
  | 'processing'
  | 'completed'
  | 'failed'
  | 'cancelled';

/**
 * Job priority levels
 */
export type JobPriority = 'low' | 'normal' | 'high' | 'urgent';

/**
 * A queued document-processing job and its bookkeeping fields.
 */
export interface ProcessingJob {
  id: string;
  // Document this job operates on.
  documentId: string;
  // Owning user's identifier.
  userId: string;
  status: JobStatus;
  priority: JobPriority;
  createdAt: Date;
  updatedAt: Date;
  // Set when the job starts executing.
  startedAt?: Date;
  // Set when the job finishes (success or failure).
  completedAt?: Date;
  // Failure message when status is 'failed'.
  error?: string;
  // Retries attempted so far.
  retryCount: number;
  // Maximum retries before the job is abandoned.
  maxRetries: number;
  // Arbitrary job-specific data.
  metadata?: Record<string, any>;
}

/**
 * Tunables for the job queue.
 */
export interface JobQueueConfig {
  maxConcurrentJobs: number;
  // Delay between retries — units not shown here; presumably ms. TODO confirm.
  retryDelay: number;
  maxRetries: number;
  // Per-job timeout — units not shown here; presumably ms. TODO confirm.
  timeout: number;
}

/**
 * Aggregate outcome of one queue-processing pass.
 */
export interface JobProcessingResult {
  success: boolean;
  jobsProcessed: number;
  jobsCompleted: number;
  jobsFailed: number;
  // Total wall-clock time for the pass — presumably ms. TODO confirm.
  processingTime: number;
  // Per-job error messages, populated when any job failed.
  errors?: string[];
}

56
backend/src/types/llm.ts Normal file
View File

@@ -0,0 +1,56 @@
/**
 * Shared types for LLM services
 * (requests/responses, analysis results, and provider identifiers).
 */
import { CIMReview, cimReviewSchema } from '../services/llmSchemas';
// NOTE(review): `cimReviewSchema` does not appear to be referenced in this
// file's visible declarations — confirm before removing. If both imports are
// type-only, prefer `import type` so they erase cleanly.
import { z } from 'zod';

/**
 * A single request to an LLM provider.
 */
export interface LLMRequest {
  // User/content prompt sent to the model.
  prompt: string;
  // Optional system prompt for the conversation.
  systemPrompt?: string;
  // Cap on generated tokens.
  maxTokens?: number;
  // Sampling temperature.
  temperature?: number;
  // Provider-specific model identifier.
  model?: string;
}

/**
 * Normalized response returned by an LLM provider.
 */
export interface LLMResponse {
  success: boolean;
  // Generated text; contents on failure not specified here — TODO confirm.
  content: string;
  // Token accounting, when the provider reports usage.
  usage?: {
    promptTokens: number;
    completionTokens: number;
    totalTokens: number;
  };
  // Failure message when success is false.
  error?: string;
}

/**
 * CIM analysis result from LLM processing
 */
export interface CIMAnalysisResult {
  success: boolean;
  // Parsed CIM review payload when extraction succeeded.
  jsonOutput?: CIMReview;
  error?: string;
  // Model identifier used for the analysis.
  model: string;
  // Cost of the call — currency/units not shown here; presumably USD. TODO confirm.
  cost: number;
  inputTokens: number;
  outputTokens: number;
  // Zod issues recorded when the model output failed schema validation.
  validationIssues?: z.ZodIssue[];
}

/**
 * Supported LLM provider identifiers.
 */
export type LLMProvider = 'anthropic' | 'openai' | 'openrouter';

/**
 * LLM endpoint categories used for usage/cost tracking.
 */
export type LLMEndpoint = 'financial_extraction' | 'full_extraction' | 'other';

View File

@@ -0,0 +1,63 @@
/**
 * Shared types for document processing
 * (strategy identifiers, processor results, and processor options).
 */
import { CIMReview } from '../services/llmSchemas';

/**
 * Identifiers for the available document-processing strategies.
 */
export type ProcessingStrategy =
  | 'document_ai_agentic_rag'
  | 'simple_full_document'
  | 'parallel_sections'
  | 'document_ai_multi_pass_rag';

/**
 * Standard processing result for document processors
 */
export interface ProcessingResult {
  success: boolean;
  // Human-readable summary of the processed document.
  summary: string;
  // Structured CIM review extracted from the document.
  analysisData: CIMReview;
  // Strategy that produced this result.
  processingStrategy: ProcessingStrategy;
  // Processing duration — units not shown here; presumably ms. TODO confirm.
  processingTime: number;
  // Number of LLM/API calls made during processing.
  apiCalls: number;
  error?: string;
}

/**
 * Extended processing result for RAG processors with chunk information
 */
export interface RAGProcessingResult extends ProcessingResult {
  totalChunks?: number;
  processedChunks?: number;
  // Mean chunk size — unit (characters vs tokens) not shown here. TODO confirm.
  averageChunkSize?: number;
  // Memory usage figure — unit not shown here. TODO confirm.
  memoryUsage?: number;
}

/**
 * Processing options for document processors
 */
export interface ProcessingOptions {
  strategy?: ProcessingStrategy;
  // Raw file contents, when the processor reads the file directly.
  fileBuffer?: Buffer;
  fileName?: string;
  mimeType?: string;
  enableSemanticChunking?: boolean;
  enableMetadataEnrichment?: boolean;
  // Similarity cutoff used by retrieval/chunk matching.
  similarityThreshold?: number;
  // Pre-extracted table structures, when available upstream.
  structuredTables?: any[];
  [key: string]: any; // Allow additional options
}

/**
 * Document AI processing result
 */
export interface DocumentAIProcessingResult {
  success: boolean;
  // Extracted document text.
  content: string;
  // Provider-specific extraction metadata.
  metadata?: any;
  error?: string;
}

View File

@@ -0,0 +1,204 @@
/**
* Common Error Handling Utilities
* Shared error handling patterns used across services
*/
import { logger } from './logger';
/**
 * Extract a human-readable message from any thrown value.
 *
 * Handles Error instances, plain strings, and object-shaped errors carrying
 * a `message` or `error` property. Fix over the original: the original could
 * return a non-string value (when `errorObj.error` was itself an object),
 * violating the declared `string` return type, and fell back to
 * `String(error)` which renders plain objects as "[object Object]".
 *
 * @param error - The caught value (unknown, per strict catch clauses)
 * @returns A string message; never a non-string value
 */
export function extractErrorMessage(error: unknown): string {
  if (error instanceof Error) {
    return error.message;
  }
  if (typeof error === 'string') {
    return error;
  }
  if (error && typeof error === 'object') {
    const errorObj = error as Record<string, any>;
    // `||` (not `??`) preserved from the original: empty-string messages
    // fall through to the next candidate.
    const candidate = errorObj.message || errorObj.error;
    if (typeof candidate === 'string') {
      return candidate;
    }
    if (candidate instanceof Error) {
      return candidate.message;
    }
    try {
      // JSON rendering is informative for plain objects, unlike String(obj).
      return JSON.stringify(error);
    } catch {
      // Circular structures etc. — last-resort coercion.
      return String(error);
    }
  }
  return String(error);
}
/**
 * Return the stack trace when the value is an Error instance;
 * any other thrown value yields undefined.
 */
export function extractErrorStack(error: unknown): string | undefined {
  return error instanceof Error ? error.stack : undefined;
}
/**
 * Build a structured description of an error suitable for logging.
 * Error instances yield name/message/stack (type 'Error'); every other
 * value is captured with its runtime typeof and the raw value itself.
 */
export function extractErrorDetails(error: unknown): {
  name?: string;
  message: string;
  stack?: string;
  type: string;
  value?: any;
} {
  if (!(error instanceof Error)) {
    return {
      message: extractErrorMessage(error),
      type: typeof error,
      value: error,
    };
  }
  const { name, message, stack } = error;
  return { name, message, stack, type: 'Error' };
}
/**
 * Heuristically detect timeout errors by inspecting the message text.
 */
export function isTimeoutError(error: unknown): boolean {
  // Normalize once instead of lowercasing per comparison.
  const normalized = extractErrorMessage(error).toLowerCase();
  return ['timeout', 'timed out', 'exceeded'].some(token => normalized.includes(token));
}
/**
 * Detect rate-limit errors via HTTP status 429, provider error type, or
 * message content.
 *
 * Fix over the original: message inspection only ran for object-shaped
 * errors, so a plain string like "rate limit exceeded" returned false —
 * inconsistent with isTimeoutError, which checks messages for all shapes.
 */
export function isRateLimitError(error: unknown): boolean {
  if (error && typeof error === 'object') {
    const errorObj = error as Record<string, any>;
    if (errorObj.status === 429 ||
        errorObj.code === 429 ||
        errorObj.error?.type === 'rate_limit_error') {
      return true;
    }
  }
  // Message inspection applies to every error shape (strings included).
  return extractErrorMessage(error).toLowerCase().includes('rate limit');
}
/**
 * Decide whether an error is worth retrying. Retryable classes:
 * timeouts, rate limits (with backoff), network/connection failures,
 * and 5xx server responses.
 */
export function isRetryableError(error: unknown): boolean {
  // Timeouts and rate limits are transient by nature.
  if (isTimeoutError(error) || isRateLimitError(error)) {
    return true;
  }

  // Network-level failures, detected by message content.
  const networkTokens = ['network', 'connection', 'econnrefused', 'etimedout'];
  const normalized = extractErrorMessage(error).toLowerCase();
  if (networkTokens.some(token => normalized.includes(token))) {
    return true;
  }

  // 5xx server errors carried on object-shaped errors.
  if (error && typeof error === 'object') {
    const { status, statusCode } = error as Record<string, any>;
    const httpStatus = status || statusCode;
    if (httpStatus && httpStatus >= 500 && httpStatus < 600) {
      return true;
    }
  }

  return false;
}
/**
 * Extract the retry delay, in seconds, from a rate-limit style error.
 * Checks the HTTP `retry-after` header and common API payload fields.
 *
 * Fix over the original: a non-numeric header made `parseInt` return NaN,
 * which was propagated to callers instead of the documented default;
 * negative values also passed through unchecked.
 *
 * @param error - The caught value, typically an HTTP/provider error object
 * @returns Delay in seconds; 60 when absent or unparseable
 */
export function extractRetryAfter(error: unknown): number {
  const DEFAULT_RETRY_SECONDS = 60;
  if (error && typeof error === 'object') {
    const errorObj = error as Record<string, any>;
    const retryAfter = errorObj.headers?.['retry-after'] ||
                       errorObj.error?.retry_after ||
                       errorObj.retryAfter;
    if (retryAfter !== undefined && retryAfter !== null) {
      const seconds = typeof retryAfter === 'number'
        ? retryAfter
        : parseInt(retryAfter, 10);
      // Reject NaN and negative values; fall back to the default instead.
      if (Number.isFinite(seconds) && seconds >= 0) {
        return seconds;
      }
    }
  }
  return DEFAULT_RETRY_SECONDS;
}
/**
 * Log an error together with caller-supplied context, at the requested
 * level. The log payload includes the extracted message/stack/details and
 * the retryable/timeout/rate-limit classification flags, plus a timestamp.
 *
 * @param error - The caught value to describe
 * @param context - Structured context merged into the log payload
 * @param level - Log severity; defaults to 'error'
 */
export function logErrorWithContext(
  error: unknown,
  context: Record<string, any>,
  level: 'error' | 'warn' | 'info' = 'error'
): void {
  const payload = {
    ...context,
    error: {
      message: extractErrorMessage(error),
      stack: extractErrorStack(error),
      details: extractErrorDetails(error),
      isRetryable: isRetryableError(error),
      isTimeout: isTimeoutError(error),
      isRateLimit: isRateLimitError(error),
    },
    timestamp: new Date().toISOString(),
  };
  switch (level) {
    case 'error':
      logger.error('Error occurred', payload);
      break;
    case 'warn':
      logger.warn('Warning occurred', payload);
      break;
    default:
      logger.info('Info', payload);
  }
}
/**
 * Build an Error carrying optional machine-readable metadata
 * (application code, HTTP status, retryability) for upstream handlers.
 *
 * @param message - Human-readable error message
 * @param code - Application-specific error code (attached only when truthy)
 * @param statusCode - Associated HTTP status (attached only when truthy)
 * @param retryable - Explicit retryability flag (attached when passed at all)
 */
export function createStandardError(
  message: string,
  code?: string,
  statusCode?: number,
  retryable?: boolean
): Error & { code?: string; statusCode?: number; retryable?: boolean } {
  const extras: { code?: string; statusCode?: number; retryable?: boolean } = {};
  if (code) {
    extras.code = code;
  }
  if (statusCode) {
    extras.statusCode = statusCode;
  }
  if (retryable !== undefined) {
    extras.retryable = retryable;
  }
  return Object.assign(new Error(message), extras);
}
/**
 * Run an async operation, logging any failure with the supplied context
 * before rethrowing it. An optional onError hook fires after logging.
 *
 * @param fn - The async operation to execute
 * @param context - Structured context included in the error log
 * @param onError - Optional callback invoked with the caught error
 * @returns The operation's result when it succeeds
 * @throws Rethrows whatever fn threw, unmodified
 */
export async function withErrorHandling<T>(
  fn: () => Promise<T>,
  context: Record<string, any>,
  onError?: (error: unknown) => void
): Promise<T> {
  try {
    return await fn();
  } catch (caught) {
    logErrorWithContext(caught, context);
    onError?.(caught);
    throw caught;
  }
}