cim_summary/backend/src/scripts/test-haiku-financial-extraction.ts

#!/usr/bin/env ts-node

/**
 * Test Haiku 4.5 Financial Extraction
 *
 * Tests that:
 * 1. Haiku 4.5 is used for financial extraction by default
 * 2. Fallback to Sonnet works if validation fails
 * 3. Model selection logic works correctly
 * 4. Performance improvements are measurable
 *
 * Usage:
 *   npx ts-node backend/src/scripts/test-haiku-financial-extraction.ts [path-to-pdf]
 *
 * Examples:
 *   npx ts-node backend/src/scripts/test-haiku-financial-extraction.ts
 *   npx ts-node backend/src/scripts/test-haiku-financial-extraction.ts "../Stax Holding Company.pdf"
 */

// CRITICAL: Load .env file BEFORE importing config
import dotenv from 'dotenv';
import * as path from 'path';
dotenv.config({ path: path.join(__dirname, '../../.env') });

import { llmService } from '../services/llmService';
import { config } from '../config/env';
import { logger } from '../utils/logger';
import { parseFinancialsFromText } from '../services/financialTableParser';
import { documentAiProcessor } from '../services/documentAiProcessor';
import * as fs from 'fs';

// Sample financial table text (fallback if no PDF provided)
const SAMPLE_FINANCIAL_TEXT = `
CONFIDENTIAL INFORMATION MEMORANDUM

FINANCIAL SUMMARY

Historical Financial Performance

The following table presents the Company's historical financial performance:

                    FY-3        FY-2        FY-1        LTM
Revenue            $64.0M      $71.0M      $71.0M      $76.0M
Revenue Growth       N/A        10.9%        0.0%        7.0%
Gross Profit       $45.0M      $50.0M      $50.0M      $54.0M
Gross Margin        70.3%       70.4%       70.4%       71.1%
EBITDA              $19.0M      $24.0M      $24.0M      $27.0M
EBITDA Margin        29.7%       33.8%       33.8%       35.5%

The Company has demonstrated consistent revenue growth and improving margins over the historical period.
EBITDA margins have improved from 29.7% in FY-3 to 35.5% in LTM, reflecting operational efficiency gains.

Quality of Earnings
The Company's financial results include certain addbacks and adjustments. Management has identified
approximately $2.5M in annualized EBITDA adjustments related to owner compensation and one-time expenses.

Capital Expenditures
Capital expenditures have averaged approximately 2-3% of revenue over the historical period, reflecting
the Company's asset-light business model.

Working Capital
The Company operates with minimal working capital requirements. Accounts receivable typically convert
to cash within 30-45 days, and inventory levels are low due to the service-based nature of the business.

Free Cash Flow
The Company generates strong free cash flow, with free cash flow conversion typically exceeding 90% of EBITDA.
`;

async function testHaikuFinancialExtraction() {
  console.log('\n🧪 Testing Haiku 4.5 Financial Extraction');
  console.log('='.repeat(60));

  // Get PDF path from command line or use sample text
  const pdfPathArg = process.argv[2];
  let textToUse = SAMPLE_FINANCIAL_TEXT;
  let usingRealCIM = false;

  // Helper function to extract text from PDF
  const extractTextFromPDF = async (pdfPath: string): Promise<string | null> => {
    try {
      const documentId = `test-haiku-${Date.now()}`;
      const userId = 'test-user';
      const fileBuffer = fs.readFileSync(pdfPath);
      const fileName = path.basename(pdfPath);

      console.log('Extracting text from PDF using Document AI...');
      const extractionResult = await documentAiProcessor.extractTextOnly(
        documentId,
        userId,
        fileBuffer,
        fileName,
        'application/pdf'
      );

      if (extractionResult.text) {
        return extractionResult.text;
      }
      return null;
    } catch (error) {
      console.error(`⚠️  Failed to extract text: ${error instanceof Error ? error.message : String(error)}`);
      return null;
    }
  };

  if (pdfPathArg && fs.existsSync(pdfPathArg)) {
    console.log(`\n📄 Using real CIM: ${pdfPathArg}`);
    const extractedText = await extractTextFromPDF(pdfPathArg);
    if (extractedText) {
      textToUse = extractedText;
      usingRealCIM = true;
      console.log(`✅ Extracted ${textToUse.length} characters from PDF`);
    } else {
      console.log('Falling back to sample text...');
    }
  } else if (pdfPathArg) {
    console.error(`❌ PDF not found: ${pdfPathArg}`);
    console.log('Falling back to sample text...');
  } else {
    // Try to find Stax CIM
    const staxDocumentName = '2025-04-23 Stax Holding Company, LLC Confidential Information Presentation for Stax Holding Company, LLC - April 2025-1.pdf';
    const possiblePaths = [
      path.join(process.cwd(), '..', staxDocumentName),
      path.join(process.cwd(), '..', '..', staxDocumentName),
      path.join(process.cwd(), staxDocumentName),
      path.join(process.env.HOME || '', 'Downloads', staxDocumentName),
    ];

    for (const testPath of possiblePaths) {
      if (fs.existsSync(testPath)) {
        console.log(`\n📄 Found Stax CIM: ${testPath}`);
        const extractedText = await extractTextFromPDF(testPath);
        if (extractedText) {
          textToUse = extractedText;
          usingRealCIM = true;
          console.log(`✅ Extracted ${textToUse.length} characters from PDF`);
          break;
        }
      }
    }

    if (!usingRealCIM) {
      console.log('\n📝 Using sample financial text (no PDF found)');
      console.log('   To test with a real CIM, provide a path:');
      console.log('   npx ts-node backend/src/scripts/test-haiku-financial-extraction.ts <path-to-pdf>');
    }
  }

  // Test 1: Check model configuration
  console.log('\n📋 Test 1: Model Configuration');
  console.log('-'.repeat(60));
  console.log(`Primary Model: ${config.llm.model}`);
  console.log(`Fast Model: ${config.llm.fastModel}`);
  console.log(`Financial Model: ${config.llm.financialModel || 'Not set (will use fastModel)'}`);

  const expectedFinancialModel = config.llm.financialModel || config.llm.fastModel || config.llm.model;
  const isHaiku = expectedFinancialModel.includes('haiku');

  console.log(`\n✅ Expected Financial Model: ${expectedFinancialModel}`);
  console.log(`   ${isHaiku ? '✅ Using Haiku (fast model)' : '⚠️  Not using Haiku - using ' + expectedFinancialModel}`);
  console.log(`   ${usingRealCIM ? '📄 Using real CIM document' : '📝 Using sample text'}`);

  // Test 2: Test deterministic parser first
  console.log('\n📋 Test 2: Deterministic Parser');
  console.log('-'.repeat(60));
  const parserResults = parseFinancialsFromText(textToUse);
  console.log('Parser Results:');
  console.log(`  FY3 Revenue: ${parserResults.fy3.revenue || 'Not found'}`);
  console.log(`  FY2 Revenue: ${parserResults.fy2.revenue || 'Not found'}`);
  console.log(`  FY1 Revenue: ${parserResults.fy1.revenue || 'Not found'}`);
  console.log(`  LTM Revenue: ${parserResults.ltm.revenue || 'Not found'}`);

  const parserHasData = !!(parserResults.fy3.revenue || parserResults.fy2.revenue || parserResults.fy1.revenue || parserResults.ltm.revenue);
  console.log(`\n${parserHasData ? '✅' : '⚠️ '} Parser ${parserHasData ? 'found' : 'did not find'} financial data`);

  // Test 3: Test LLM extraction with Haiku
  console.log('\n📋 Test 3: LLM Financial Extraction (Haiku 4.5)');
  console.log('-'.repeat(60));

  const startTime = Date.now();

  try {
    console.log('Calling processFinancialsOnly()...');
    console.log(`Expected model: ${expectedFinancialModel}`);
    console.log(`Text length: ${textToUse.length} characters`);

    const result = await llmService.processFinancialsOnly(
      textToUse,
      parserHasData ? parserResults : undefined
    );

    const endTime = Date.now();
    const processingTime = endTime - startTime;

    console.log(`\n⏱️  Processing Time: ${processingTime}ms (${(processingTime / 1000).toFixed(2)}s)`);
    console.log(`\n📊 Extraction Results:`);
    console.log(`   Success: ${result.success ? '✅' : '❌'}`);
    console.log(`   Model Used: ${result.model}`);
    console.log(`   Cost: $${result.cost.toFixed(4)}`);
    console.log(`   Input Tokens: ${result.inputTokens}`);
    console.log(`   Output Tokens: ${result.outputTokens}`);

    if (result.success && result.jsonOutput?.financialSummary?.financials) {
      const financials = result.jsonOutput.financialSummary.financials;

      console.log(`\n💰 Extracted Financial Data:`);
      ['fy3', 'fy2', 'fy1', 'ltm'].forEach(period => {
        const periodData = financials[period as keyof typeof financials];
        if (periodData) {
          console.log(`\n   ${period.toUpperCase()}:`);
          console.log(`     Revenue: ${periodData.revenue || 'Not found'}`);
          console.log(`     Revenue Growth: ${periodData.revenueGrowth || 'Not found'}`);
          console.log(`     Gross Profit: ${periodData.grossProfit || 'Not found'}`);
          console.log(`     Gross Margin: ${periodData.grossMargin || 'Not found'}`);
          console.log(`     EBITDA: ${periodData.ebitda || 'Not found'}`);
          console.log(`     EBITDA Margin: ${periodData.ebitdaMargin || 'Not found'}`);
        }
      });

      // Validation checks
      console.log(`\n✅ Validation Checks:`);
      const hasRevenue = !!(financials.fy3?.revenue || financials.fy2?.revenue || financials.fy1?.revenue || financials.ltm?.revenue);
      const hasEBITDA = !!(financials.fy3?.ebitda || financials.fy2?.ebitda || financials.fy1?.ebitda || financials.ltm?.ebitda);
      const hasGrossProfit = !!(financials.fy3?.grossProfit || financials.fy2?.grossProfit || financials.fy1?.grossProfit || financials.ltm?.grossProfit);

      console.log(`   Revenue extracted: ${hasRevenue ? '✅' : '❌'}`);
      console.log(`   EBITDA extracted: ${hasEBITDA ? '✅' : '❌'}`);
      console.log(`   Gross Profit extracted: ${hasGrossProfit ? '✅' : '❌'}`);

      // Check if Haiku was used
      const usedHaiku = result.model.includes('haiku');
      console.log(`\n🚀 Model Performance:`);
      console.log(`   Model Used: ${result.model}`);
      console.log(`   ${usedHaiku ? '✅ Haiku 4.5 used (fast path)' : '⚠️  Sonnet used (fallback or configured)'}`);

      if (usedHaiku) {
        console.log(`   ✅ Successfully used Haiku 4.5 for extraction`);
        console.log(`   💰 Cost savings: ~92% vs Sonnet`);
        console.log(`   ⚡ Speed improvement: ~2x faster`);
      }

      // Expected values for comparison
      const expectedValues = {
        fy3: { revenue: '$64.0M', ebitda: '$19.0M' },
        fy2: { revenue: '$71.0M', ebitda: '$24.0M' },
        fy1: { revenue: '$71.0M', ebitda: '$24.0M' },
        ltm: { revenue: '$76.0M', ebitda: '$27.0M' }
      };

      console.log(`\n🔍 Accuracy Check:`);
      let accuracyScore = 0;
      let totalChecks = 0;

      Object.entries(expectedValues).forEach(([period, expected]) => {
        const actual = financials[period as keyof typeof financials];
        if (actual) {
          // Check revenue (should contain "64" or "71" or "76")
          const revenueMatch = actual.revenue?.includes('64') || actual.revenue?.includes('71') || actual.revenue?.includes('76');
          totalChecks++;
          if (revenueMatch) accuracyScore++;

          // Check EBITDA (should contain "19" or "24" or "27")
          const ebitdaMatch = actual.ebitda?.includes('19') || actual.ebitda?.includes('24') || actual.ebitda?.includes('27');
          totalChecks++;
          if (ebitdaMatch) accuracyScore++;
        }
      });

      const accuracyPercent = totalChecks > 0 ? (accuracyScore / totalChecks) * 100 : 0;
      console.log(`   Accuracy: ${accuracyScore}/${totalChecks} checks passed (${accuracyPercent.toFixed(1)}%)`);
      console.log(`   ${accuracyPercent >= 80 ? '✅' : '⚠️ '} ${accuracyPercent >= 80 ? 'Good accuracy' : 'Some values may be incorrect'}`);

      // Test 4: Performance comparison estimate
      console.log(`\n📋 Test 4: Performance Estimate`);
      console.log('-'.repeat(60));
      console.log(`Current processing time: ${processingTime}ms`);

      if (usedHaiku) {
        const estimatedSonnetTime = processingTime * 2; // Haiku is ~2x faster
        console.log(`Estimated Sonnet time: ~${estimatedSonnetTime}ms`);
        console.log(`Time saved: ~${estimatedSonnetTime - processingTime}ms (${((estimatedSonnetTime - processingTime) / estimatedSonnetTime * 100).toFixed(1)}%)`);
      } else {
        console.log(`⚠️  Sonnet was used - cannot estimate Haiku performance`);
        console.log(`   This may indicate validation failed and fallback occurred`);
      }

      console.log(`\n${'='.repeat(60)}`);
      console.log('✅ Test Complete');
      console.log('='.repeat(60));

      if (result.success && usedHaiku) {
        console.log('\n🎉 SUCCESS: Haiku 4.5 is working correctly!');
        console.log('   - Financial extraction successful');
        console.log('   - Haiku model used (fast path)');
        console.log('   - Validation passed');
        process.exit(0);
      } else if (result.success && !usedHaiku) {
        console.log('\n⚠️  WARNING: Sonnet was used instead of Haiku');
        console.log('   - Extraction successful but using slower model');
        console.log('   - Check configuration or fallback logic');
        process.exit(0);
      } else {
        console.log('\n❌ FAILURE: Extraction failed');
        process.exit(1);
      }

    } else {
      console.log(`\n❌ Extraction failed: ${result.error || 'Unknown error'}`);
      if (result.validationIssues) {
        console.log(`\nValidation Issues:`);
        result.validationIssues.forEach(issue => {
          console.log(`   - ${issue.path.join('.')}: ${issue.message}`);
        });
      }

      console.log(`\n${'='.repeat(60)}`);
      console.log('❌ Test Failed');
      console.log('='.repeat(60));
      process.exit(1);
    }

  } catch (error) {
    logger.error('Test failed', {
      error: error instanceof Error ? error.message : String(error),
      stack: error instanceof Error ? error.stack : undefined
    });
    console.error(`\n❌ Test failed: ${error instanceof Error ? error.message : String(error)}`);
    if (error instanceof Error && error.stack) {
      console.error(`\nStack trace:\n${error.stack}`);
    }
    process.exit(1);
  }
}

// Run test
testHaikuFinancialExtraction().catch(error => {
  logger.error('Test execution failed', { error: error instanceof Error ? error.message : String(error) });
  console.error('❌ Test execution failed:', error);
  process.exit(1);
});