1,556 changes: 1,556 additions & 0 deletions ENTERPRISE_FEATURE_ANALYSIS.md

Large diffs are not rendered by default.

831 changes: 831 additions & 0 deletions docs/ENTERPRISE_ROADMAP.md

Large diffs are not rendered by default.

977 changes: 977 additions & 0 deletions docs/UPDATED_RECOMMENDATIONS.md

Large diffs are not rendered by default.

1,514 changes: 1,514 additions & 0 deletions docs/implementation-plans/01-api-layer.md

Large diffs are not rendered by default.

1,577 changes: 1,577 additions & 0 deletions docs/implementation-plans/02-data-platform-integrations.md

Large diffs are not rendered by default.

914 changes: 914 additions & 0 deletions docs/implementation-plans/03-elasticsearch-integration.md

Large diffs are not rendered by default.

933 changes: 933 additions & 0 deletions docs/implementation-plans/04-compliance-security-suite.md

Large diffs are not rendered by default.

1,022 changes: 1,022 additions & 0 deletions docs/implementation-plans/05-multi-llm-provider-support.md

Large diffs are not rendered by default.

1,703 changes: 1,554 additions & 149 deletions package-lock.json

Large diffs are not rendered by default.

5 changes: 5 additions & 0 deletions package.json
@@ -14,6 +14,10 @@
"generate-embeddings": "tsx scripts/generate_embeddings.ts"
},
"dependencies": {
"@ai-sdk/anthropic": "^2.0.45",
"@ai-sdk/google": "^2.0.38",
"@ai-sdk/openai": "^2.0.68",
"@aws-sdk/client-textract": "^3.934.0",
"@radix-ui/react-checkbox": "^1.1.1",
Comment on lines +17 to 21

⚠️ Potential issue | 🔴 Critical

🧩 Analysis chain

New AI/SDK dependencies align with the LLM/OCR features; verify version compatibility

The added @ai-sdk/*, ai, and @aws-sdk/client-textract dependencies match the new multi‑provider LLM and Textract usage. From a structure standpoint this looks fine; just ensure the chosen versions are compatible with your Next 14 / React 18 / Node.js runtime and each other (peer deps, bundling, ESM/CJS).

Also applies to: 40-40


🌐 Web query:

Check the supported Node.js / React / Next.js versions and peer dependency requirements for:
- `ai@5.0.95`
- `@ai-sdk/openai@2.0.68`
- `@ai-sdk/anthropic@2.0.45`
- `@ai-sdk/google@2.0.38`
- `@aws-sdk/client-textract@3.934.0`
and confirm they are compatible with a Next.js 14.2.8 + React 18 app.

💡 Result:

Short answer: Yes — these package versions are compatible with a Next.js 14.2.8 + React 18 app, provided your runtime Node.js meets the Next.js v14 minimum (Node 18.17+) and you satisfy the AI SDK peer deps (notably zod >= 3.25.0). Evidence:

  • Next.js v14 requires Node >= 18.17 and is intended to be used with React 18. (Next.js upgrade notes). [1]
  • The AI SDK v5 (ai@5.x and the @ai-sdk/* v2 series) requires Node 18+ in its docs and additionally lists zod (>= 3.25.0) as a peer dependency for the v5 migration / providers. The migration/getting-started docs for AI SDK v5 show the ai package and @ai-sdk/* v2 series and call out zod as a required peer dependency. (The @ai-sdk/* provider packages are the v2 series used by ai@5.x). [2][3]
  • Individual @ai-sdk provider packages (openai / anthropic / google) are part of the AI SDK v2 provider releases and are published as companion provider packages for ai@5 — their docs and package pages align with the AI SDK v5 requirements above. (Examples: Anthropic provider listing; OpenAI/Google providers are the same provider series). [4]
  • @aws-sdk/client-textract (AWS SDK for JavaScript v3) targets modern Node.js LTS and AWS has announced v3 no longer supports Node 16.x; v3 is intended for Node 18+ (AWS SDK v3 Node support guidance). The modular v3 clients (including client-textract@3.934.0) do not impose React/Next peer deps and are compatible in server/runtime code (Node) used by Next.js. [5][6]

What to check in your project

  • Use Node >= 18.17 (Next.js 14 minimum). If your environment uses a lower Node, upgrade. [1]
  • Add/ensure zod >= 3.25.0 in your package.json if you use ai@5.x / @ai-sdk/* v2 features that declare it as a peer dependency. [2][3]
  • @aws-sdk/client-textract has no React/Next peer deps; install it normally for server-side usage (Node runtime). [5]

Sources

  • Next.js v14 upgrade / requirements (Node >=18.17, React 18). [1]
  • AI SDK v5 migration / getting-started (ai@5.x, @ai-sdk/* v2, and zod peer dep note). [2][3]
  • @ai-sdk/anthropic package listing / provider info (example provider page). [4]
  • AWS SDK for JavaScript (v3) Node support / end-of-support notices (Node 16 EOL; v3 targets Node 18+). [5][6]

If you want, I can fetch the exact peerDependencies sections from each package.json for these exact versions and paste them here.



---

🏁 Script executed:

```shell
#!/bin/bash
# Check for zod dependency in package.json
rg '"zod"' package.json -A 1
```

Length of output: 25


Upgrade zod to satisfy ai@5.x peer dependency requirement

The added dependencies are compatible with Next.js 14.2.8 + React 18 (Node 18.17+), but zod needs to be upgraded. The AI SDK v5 package (ai@5.0.95) requires zod >= 3.25.0 as a peer dependency. Currently, package.json specifies zod@^3.23.8, which falls below the minimum. Update to zod@^3.25.0 or higher to prevent runtime failures when using the AI SDK providers.

🤖 Prompt for AI Agents
In package.json around lines 17 to 21, the project currently pins zod to ^3.23.8
which is below the ai@5.x peer requirement; update the zod entry to ^3.25.0 (or
a later 3.x release) in package.json, then run the package manager (npm install
or yarn install) to update the lockfile and ensure dependencies resolve; finally
run your test/build steps (or a simple start) to verify there are no runtime
peer-dependency issues.

"@radix-ui/react-collapsible": "^1.1.0",
"@radix-ui/react-dialog": "^1.1.4",
@@ -33,6 +37,7 @@
"@supabase/supabase-js": "^2.45.3",
"@types/pdfjs-dist": "^2.10.378",
"@types/uuid": "^10.0.0",
"ai": "^5.0.95",
"bcryptjs": "^2.4.3",
"checkbox": "^0.0.1",
"class-variance-authority": "^0.7.0",
138 changes: 138 additions & 0 deletions src/app/api/v1/chat/route.ts
@@ -0,0 +1,138 @@
/**
* Chat Completion Endpoint
*
* POST /api/v1/chat
*
* Generate chat completions using multi-provider LLM.
*/

import { NextRequest } from 'next/server';
import { z } from 'zod';
import { generateCompletion, generateStreamingCompletion, type LLMProviderType } from '@/lib/llm';
import {
validateAPIKey,
hasPermission,
checkRateLimit,
authError,
rateLimitError,
} from '../utils/auth';
import { ErrorResponses, handleError } from '../utils/errors';

// Request validation schema
const ChatRequestSchema = z.object({
messages: z.array(
z.object({
role: z.enum(['system', 'user', 'assistant']),
content: z.string(),
})
),
provider: z.enum(['openai', 'anthropic', 'google', 'azure', 'ollama']).optional(),
model: z.string().optional(),
temperature: z.number().min(0).max(2).optional(),
maxTokens: z.number().positive().optional(),
stream: z.boolean().optional(),
});

export async function POST(request: NextRequest) {
try {
// Authenticate
const keyInfo = await validateAPIKey(request);
if (!keyInfo) {
return authError('Invalid or missing API key');
}

// Check permission
if (!hasPermission(keyInfo, 'chat')) {
return authError('API key does not have chat permission', 403);
}

// Check rate limit
const rateLimit = checkRateLimit(keyInfo);
if (!rateLimit.allowed) {
return rateLimitError(rateLimit.resetAt);
}

// Parse and validate request body
const body = await request.json();
const validation = ChatRequestSchema.safeParse(body);

if (!validation.success) {
return ErrorResponses.validationError('Invalid request body', {
errors: validation.error.flatten().fieldErrors,
});
}

const { messages, provider, model, temperature, maxTokens, stream } = validation.data;

// Determine provider and model
const llmProvider = (provider || 'openai') as LLMProviderType;
const llmModel = model || (llmProvider === 'openai' ? 'gpt-4o' : undefined);

if (!llmModel) {
return ErrorResponses.validationError('Model must be specified for this provider');
}

// Build prompt from messages
const systemMessage = messages.find((m) => m.role === 'system')?.content;
const conversationMessages = messages.filter((m) => m.role !== 'system');

// Format conversation for prompt
const prompt = conversationMessages
.map((m) => `${m.role === 'user' ? 'User' : 'Assistant'}: ${m.content}`)
.join('\n\n');

const config = {
provider: llmProvider,
model: llmModel,
temperature,
maxTokens,
};

if (stream) {
// Streaming response
const textStream = await generateStreamingCompletion({
prompt,
config,
systemPrompt: systemMessage,
});

// Return the stream with appropriate headers
return new Response(textStream, {
headers: {
'Content-Type': 'text/event-stream',
'Cache-Control': 'no-cache',
Connection: 'keep-alive',
'X-RateLimit-Remaining': String(rateLimit.remaining),
'X-RateLimit-Reset': String(rateLimit.resetAt),
},
});
Comment on lines +91 to +108

⚠️ Potential issue | 🔴 Critical

🧩 Analysis chain

Clarify streaming format vs text/event-stream header

generateStreamingCompletion returns a plain text ReadableStream, but the response is advertised as text/event-stream. Unless textStream is already SSE‑framed, EventSource/SSE clients may misinterpret the stream. Consider either:

  • Using the Vercel AI helper that returns a proper SSE Response (e.g. toDataStreamResponse() upstream in generateStreamingCompletion), or
  • Changing the content type to a generic streaming type (e.g. text/plain) if consumers will read raw chunks via fetch/ReadableStream.

🌐 Web query:

What is the recommended way to return a streamed chat completion with Vercel AI SDK `streamText` so that clients receive a proper `text/event-stream` SSE response?

💡 Result:

Use streamText and return its built-in SSE response helper — call result.toUIMessageStreamResponse() (or toDataStreamResponse for the simpler "data" protocol) and return that Response so the SDK sets the proper text/event-stream headers and protocol header for you.

Example (Node / Vercel function):

const result = streamText({ model: openai('gpt-4o-mini'), messages });
return result.toUIMessageStreamResponse({
  headers: {
    // optional extra headers
    'X-Chat-Id': chatId,
  },
});

This yields a Response with Content-Type: text/event-stream; charset=utf-8 and x-vercel-ai-ui-message-stream: v1 (uses the SDK's UI message stream conversion). [1][2][3]

Sources: Official SDK internals and examples. [1] [2] [3]





---

🏁 Script executed:

```shell
#!/bin/bash
# Find and inspect generateStreamingCompletion implementation
rg -n "generateStreamingCompletion" --type=ts -B2 -A10
```

Length of output: 2932


🏁 Script executed:

```shell
#!/bin/bash
# Search for imports of Vercel AI SDK to understand what's being used
rg -n "streamText\|toUIMessageStreamResponse\|toDataStreamResponse" --type=ts -B2 -A2
```

Length of output: 0


🏁 Script executed:

```shell
#!/bin/bash
# Find where Response is constructed with text/event-stream
rg -n "text/event-stream" --type=ts -B5 -A5
```

Length of output: 736



---

🏁 Script executed:

```shell
#!/bin/bash
# View the full generateStreamingCompletion implementation
sed -n '83,110p' src/lib/llm/llm-service.ts
```

Length of output: 729


Fix streaming response to use Vercel AI SDK's proper SSE helper

The review comment is correct. generateStreamingCompletion() currently returns result.textStream, which is raw text without SSE framing. While the route handler sets the text/event-stream header, the actual stream content is not SSE-formatted—clients expecting proper Server-Sent Events protocol will fail.

Per Vercel AI SDK recommendations, use result.toUIMessageStreamResponse() which automatically sets proper text/event-stream headers and protocol framing.

Required changes:

  1. src/lib/llm/llm-service.ts (line 83–108): Change generateStreamingCompletion() to return Promise<Response> and use result.toUIMessageStreamResponse() instead of result.textStream.
  2. src/app/api/v1/chat/route.ts (line 93–107): Update to directly return the Response from generateStreamingCompletion() instead of manually wrapping it (see the sketch after this comment).
🤖 Prompt for AI Agents
In src/app/api/v1/chat/route.ts around lines 91–108 and
src/lib/llm/llm-service.ts around lines 83–108, the streaming flow currently
returns a raw text stream and wraps it with SSE headers, but the stream lacks
SSE framing; update generateStreamingCompletion in llm-service.ts to return a
Promise<Response> using result.toUIMessageStreamResponse() (so the SDK applies
proper SSE framing and headers), and in route.ts simply await and return that
Response directly instead of re-wrapping the stream and headers.
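
For reference, a minimal sketch of what the suggested change could look like, assuming the service is built on `streamText` from the `ai` package. The OpenAI-only model resolution and the argument shape are simplifications; the actual `generateStreamingCompletion` in `llm-service.ts` handles multiple providers and may differ in signature.

```ts
// Sketch only (not the current llm-service implementation): produce a completion
// stream and let the AI SDK return a properly framed SSE Response.
import { streamText } from 'ai';
import { openai } from '@ai-sdk/openai';

interface StreamingCompletionArgs {
  prompt: string;
  config: { model: string; temperature?: number };
  systemPrompt?: string;
}

export function generateStreamingCompletion({
  prompt,
  config,
  systemPrompt,
}: StreamingCompletionArgs): Response {
  const result = streamText({
    // Provider selection is simplified to OpenAI here; the real service would
    // resolve the model from its multi-provider config.
    model: openai(config.model),
    system: systemPrompt,
    prompt,
    temperature: config.temperature,
  });

  // toUIMessageStreamResponse() sets Content-Type: text/event-stream and applies
  // the SDK's SSE framing, so the route can return this Response unchanged.
  return result.toUIMessageStreamResponse({
    headers: { 'Cache-Control': 'no-cache' },
  });
}

// The streaming branch in route.ts then collapses to:
//   if (stream) {
//     return generateStreamingCompletion({ prompt, config, systemPrompt: systemMessage });
//   }
```

If the rate-limit headers still need to be attached, toUIMessageStreamResponse accepts a headers option (as shown in the web query result above), or the route can copy them onto the returned Response.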

} else {
// Non-streaming response
const result = await generateCompletion({
prompt,
config,
systemPrompt: systemMessage,
});

return Response.json(
{
success: true,
data: {
content: result.text,
usage: result.usage,
model: llmModel,
provider: llmProvider,
},
},
{
headers: {
'X-RateLimit-Remaining': String(rateLimit.remaining),
'X-RateLimit-Reset': String(rateLimit.resetAt),
},
}
);
}
} catch (error) {
return handleError(error);
}
}
124 changes: 124 additions & 0 deletions src/app/api/v1/extract/route.ts
@@ -0,0 +1,124 @@
/**
* Document Extraction Endpoint
*
* POST /api/v1/extract
*
* Extract text from PDF documents using OCR.
*/

import { NextRequest } from 'next/server';
import { z } from 'zod';
import { extractText, type OCRMethod } from '@/lib/ocr';
import {
validateAPIKey,
hasPermission,
checkRateLimit,
authError,
rateLimitError,
} from '../utils/auth';
import { ErrorResponses, handleError } from '../utils/errors';

// Request validation schema
const ExtractRequestSchema = z.object({
// Either file (base64) or url must be provided
file: z.string().optional(),
url: z.string().url().optional(),
// OCR options
method: z.enum(['llmwhisperer', 'deepseek', 'textract', 'tesseract', 'pdfjs']).optional(),
preserveLayout: z.boolean().optional(),
detectForms: z.boolean().optional(),
extractTables: z.boolean().optional(),
pages: z.array(z.number().positive()).optional(),
language: z.string().optional(),
password: z.string().optional(),
});

export async function POST(request: NextRequest) {
try {
// Authenticate
const keyInfo = await validateAPIKey(request);
if (!keyInfo) {
return authError('Invalid or missing API key');
}

// Check permission
if (!hasPermission(keyInfo, 'extract')) {
return authError('API key does not have extraction permission', 403);
}

// Check rate limit
const rateLimit = checkRateLimit(keyInfo);
if (!rateLimit.allowed) {
return rateLimitError(rateLimit.resetAt);
}

// Parse and validate request body
const body = await request.json();
const validation = ExtractRequestSchema.safeParse(body);

if (!validation.success) {
return ErrorResponses.validationError('Invalid request body', {
errors: validation.error.flatten().fieldErrors,
});
}

const { file, url, method, preserveLayout, detectForms, extractTables, pages, language, password } =
validation.data;

// Ensure either file or url is provided
if (!file && !url) {
return ErrorResponses.validationError('Either file (base64) or url must be provided');
}

// Convert base64 to buffer if file provided
let input: Buffer | string;
if (file) {
try {
input = Buffer.from(file, 'base64');
} catch {
return ErrorResponses.validationError('Invalid base64 file data');
}
} else {
input = url!;
}
Comment on lines +65 to +83

⚠️ Potential issue | 🟡 Minor

Tighten input-source and base64 handling; avoid unnecessary cast

A few small issues in the input handling block:

  • The comment says “Either file (base64) or url must be provided”, but the logic only checks that at least one is present. If both are sent, file silently wins and url is ignored. Consider enforcing “exactly one” source, e.g. with a refinement on the Zod schema or an explicit if (file && url) validation error.
  • Buffer.from(file, 'base64') seldom throws for malformed base64; your try/catch will almost never return “Invalid base64 file data”, and bad input is more likely to fail later inside extractText as a 500. If you care about returning a clear 4xx, consider validating the base64 string (length/charset) or using a small helper to detect obviously invalid data before calling OCR.
  • method: method as OCRMethod forces an optional field into the non‑optional OCRMethod type. Since extractText already chooses a method when options?.method is falsy, you can drop the cast and allow method to be undefined naturally for better type safety.
  • Minor: if pages are intended as page numbers, z.array(z.number().positive()) will accept non‑integers; z.array(z.number().int().positive()) would better model that constraint.

These refinements would make the endpoint behavior more predictable and validation errors clearer without changing the overall design; a sketch of the suggested schema-level changes follows after this comment.

Also applies to: 85-97
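
As a concrete illustration of the schema-level suggestions above, here is a minimal sketch, assuming the rest of the handler stays as-is; the base64 check is a rough heuristic rather than a full validator:

```ts
// Sketch of a tightened request schema: exactly one input source, integer page
// numbers, and a cheap sanity check on the base64 payload before OCR runs.
import { z } from 'zod';

// Standard base64 alphabet with optional trailing padding (heuristic only).
const BASE64_RE = /^[A-Za-z0-9+/]+={0,2}$/;

const ExtractRequestSchema = z
  .object({
    file: z.string().optional(),
    url: z.string().url().optional(),
    method: z.enum(['llmwhisperer', 'deepseek', 'textract', 'tesseract', 'pdfjs']).optional(),
    preserveLayout: z.boolean().optional(),
    detectForms: z.boolean().optional(),
    extractTables: z.boolean().optional(),
    pages: z.array(z.number().int().positive()).optional(), // page numbers are whole numbers
    language: z.string().optional(),
    password: z.string().optional(),
  })
  .refine((data) => Boolean(data.file) !== Boolean(data.url), {
    message: 'Provide exactly one of file (base64) or url',
  })
  .refine(
    (data) => !data.file || (data.file.length % 4 === 0 && BASE64_RE.test(data.file)),
    { message: 'file must be valid base64 data', path: ['file'] }
  );
```

With a schema like this, the explicit `!file && !url` check and the try/catch around `Buffer.from` become redundant, and `method` can be passed to `extractText` without the `as OCRMethod` cast, assuming `extractText` accepts an optional method as the comment above notes.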


// Extract text
const result = await extractText({
input,
options: {
method: method as OCRMethod,
preserveLayout,
detectForms,
extractTables,
pages,
language,
password,
},
});

// Return result with rate limit headers
return Response.json(
{
success: true,
data: {
text: result.text,
markdown: result.markdown,
confidence: result.confidence,
method: result.method,
pageCount: result.pageCount,
processingTimeMs: result.processingTimeMs,
tables: result.tables,
formFields: result.formFields,
},
},
{
headers: {
'X-RateLimit-Remaining': String(rateLimit.remaining),
'X-RateLimit-Reset': String(rateLimit.resetAt),
},
}
);
} catch (error) {
return handleError(error);
}
}
55 changes: 55 additions & 0 deletions src/app/api/v1/health/route.ts
@@ -0,0 +1,55 @@
/**
* Health Check Endpoint
*
* GET /api/v1/health
*
* Returns service health status and available features.
*/

import { NextRequest } from 'next/server';
import { isProviderAvailable, getAvailableProviders } from '@/lib/llm';
import { getLLMWhispererQuota } from '@/lib/ocr';

export async function GET(request: NextRequest) {
const startTime = Date.now();

// Check service health
const [llmProviders, ocrQuota] = await Promise.all([
getAvailableProviders(),
getLLMWhispererQuota(),
]);

const health = {
status: 'healthy',
timestamp: new Date().toISOString(),
version: '1.0.0',
responseTimeMs: Date.now() - startTime,
services: {
llm: {
status: llmProviders.length > 0 ? 'available' : 'degraded',
providers: llmProviders,
},
ocr: {
status: ocrQuota ? 'available' : 'limited',
llmwhisperer: ocrQuota
? {
remaining: ocrQuota.remaining,
limit: ocrQuota.limit,
}
: null,
textract: !!process.env.AWS_ACCESS_KEY_ID,
deepseek: !!process.env.DEEPSEEK_OCR_ENDPOINT,
},
database: {
status: process.env.NEXT_PUBLIC_SUPABASE_URL ? 'configured' : 'not_configured',
},
},
};

// Determine overall status
if (llmProviders.length === 0 && !ocrQuota) {
health.status = 'degraded';
}

return Response.json(health);
}