From 5f190fbf02c1fdd53f52038cdb90eff8f6374336 Mon Sep 17 00:00:00 2001 From: overcuriousity Date: Wed, 30 Jul 2025 23:38:54 +0200 Subject: [PATCH] try work with embeddings --- src/data/tools.yaml | 60 +++ src/pages/api/ai/embeddings-status.ts | 18 + src/pages/api/ai/enhance-input.ts | 122 ++---- src/pages/api/ai/query.ts | 601 ++++++++++++++------------ src/utils/aiPrompts.ts | 221 ++++++++++ src/utils/aiService.ts | 106 +++++ src/utils/embeddingsService.ts | 215 +++++++++ src/utils/rateLimitedQueue.ts | 55 ++- 8 files changed, 1025 insertions(+), 373 deletions(-) create mode 100644 src/pages/api/ai/embeddings-status.ts create mode 100644 src/utils/aiPrompts.ts create mode 100644 src/utils/aiService.ts create mode 100644 src/utils/embeddingsService.ts diff --git a/src/data/tools.yaml b/src/data/tools.yaml index c742722..fae358a 100644 --- a/src/data/tools.yaml +++ b/src/data/tools.yaml @@ -226,6 +226,66 @@ tools: - TheHive 5 - Cortex - OpenCTI + - name: DFIR-IRIS + icon: 🌺 + type: software + description: >- + Collaborative Incident Response Management Platform für strukturierte + DFIR-Case-Organisation. Zentralisiert alle Aspekte einer Untersuchung: + Assets, IOCs, Tasks, Timeline, Evidence-Tracking. Multi-User-Environment + mit granularen Permissions für verschiedene Analysten-Rollen. Besonders + wertvoll: Case-Templates standardisieren Workflows, automatische IOC- + Enrichment via MISP/OpenCTI, integrierte Timeline-Visualisierung, + Evidence-Chain-of-Custody-Tracking. Plugin-System erweitert für Custom- + Integrations. RESTful API für Tool-Orchestrierung. Dashboard zeigt Case- + Status und Team-Workload. Notes-System dokumentiert Findings strukturiert. + Reporting-Engine generiert Executive-Summaries. Die Web-basierte + Architektur skaliert von kleinen Teams bis Enterprise-SOCs. Docker- + Deployment vereinfacht Installation. Besonders stark bei komplexen, + langwierigen Ermittlungen mit mehreren Beteiligten. Open-Source + Alternative zu kommerziellen Case-Management-Systemen. 
+ domains: + - incident-response + - static-investigations + - malware-analysis + - fraud-investigation + - network-forensics + - mobile-forensics + - cloud-forensics + phases: + - data-collection + - examination + - analysis + - reporting + platforms: + - Web + related_software: + - TheHive 5 + - MISP + - OpenCTI + domain-agnostic-software: + - collaboration-general + skillLevel: intermediate + accessType: server-based + url: https://dfir-iris.org/ + projectUrl: '' + license: LGPL-3.0 + knowledgebase: false + tags: + - web-interface + - case-management + - collaboration + - multi-user-support + - api + - workflow + - timeline-view + - ioc-tracking + - evidence-management + - reporting + - plugin-support + - docker-ready + related_concepts: + - Digital Evidence Chain of Custody - name: Timesketch icon: ⏱️ type: software diff --git a/src/pages/api/ai/embeddings-status.ts b/src/pages/api/ai/embeddings-status.ts new file mode 100644 index 0000000..b08eb77 --- /dev/null +++ b/src/pages/api/ai/embeddings-status.ts @@ -0,0 +1,18 @@ +import type { APIRoute } from 'astro'; +import { isEmbeddingsEnabled } from '../../../utils/embeddingsService.js'; +import { apiResponse } from '../../../utils/api.js'; + +export const prerender = false; + +export const GET: APIRoute = async () => { + const embeddingsEnabled = isEmbeddingsEnabled(); + + return apiResponse.success({ + embeddingsEnabled, + endpointConfigured: !!process.env.AI_EMBEDDINGS_ENDPOINT, + apiKeyConfigured: !!process.env.AI_EMBEDDINGS_API_KEY, + model: process.env.AI_EMBEDDINGS_MODEL || 'mistral-embed', + maxCandidates: parseInt(process.env.AI_EMBEDDING_CANDIDATES || '30'), + similarityThreshold: parseFloat(process.env.AI_SIMILARITY_THRESHOLD || '0.3') + }); +}; \ No newline at end of file diff --git a/src/pages/api/ai/enhance-input.ts b/src/pages/api/ai/enhance-input.ts index 34d5347..7d27117 100644 --- a/src/pages/api/ai/enhance-input.ts +++ b/src/pages/api/ai/enhance-input.ts @@ -1,23 +1,15 @@ -// src/pages/api/ai/enhance-input.ts import type { APIRoute } from 'astro'; import { withAPIAuth } from '../../../utils/auth.js'; import { apiError, apiServerError, createAuthErrorResponse } from '../../../utils/api.js'; import { enqueueApiCall } from '../../../utils/rateLimitedQueue.js'; +import { callAI, getAnalyzerConfig } from '../../../utils/aiService.js'; +import { createEnhancementPrompt } from '../../../utils/aiPrompts.js'; export const prerender = false; -function getEnv(key: string): string { - const value = process.env[key]; - if (!value) { - throw new Error(`Missing environment variable: ${key}`); - } - return value; -} - -const AI_MODEL = getEnv('AI_MODEL'); const rateLimitStore = new Map(); -const RATE_LIMIT_WINDOW = 60 * 1000; // 1 minute -const RATE_LIMIT_MAX = 5; // 5 enhancement requests per minute per user +const RATE_LIMIT_WINDOW = 60 * 1000; +const RATE_LIMIT_MAX = 5; function sanitizeInput(input: string): string { return input @@ -26,7 +18,7 @@ function sanitizeInput(input: string): string { .replace(/\b(system|assistant|user)\s*[:]/gi, '[ROLE_REMOVED]') .replace(/\b(ignore|forget|disregard)\s+(previous|all|your)\s+(instructions?|context|rules?)/gi, '[INSTRUCTION_REMOVED]') .trim() - .slice(0, 1000); // Shorter limit for enhancement + .slice(0, 1000); } function checkRateLimit(userId: string): boolean { @@ -55,33 +47,8 @@ function cleanupExpiredRateLimits() { } } -// Clean up expired limits every 5 minutes setInterval(cleanupExpiredRateLimits, 5 * 60 * 1000); -function createEnhancementPrompt(input: string): string { - return ` 
-Du bist eine KI für digitale Forensik. Der Nutzer beschreibt ein forensisches Szenario. Analysiere die Eingabe. - -Wenn die Beschreibung unvollständig oder vage ist, stelle bis zu drei präzise Rückfragen im JSON-Array-Format, um wichtige Details zu klären (z. B. Vorfalltyp, System, Ziel, Datenquellen, Zeit, Beteiligte, rechtlicher Rahmen). - -Wenn die Eingabe bereits klar, spezifisch und vollständig ist, gib stattdessen nur eine leere Liste [] zurück. - -Antwortformat strikt: - -\`\`\`json -[ - "Frage 1?", - "Frage 2?", - "Frage 3?" -] -\`\`\` - -Nutzer-Eingabe: -${input} - `.trim(); -} - - export const POST: APIRoute = async ({ request }) => { try { const authResult = await withAPIAuth(request, 'ai'); @@ -110,77 +77,68 @@ export const POST: APIRoute = async ({ request }) => { const systemPrompt = createEnhancementPrompt(sanitizedInput); const taskId = `enhance_${userId}_${Date.now()}_${Math.random().toString(36).substr(2, 4)}`; - const aiResponse = await enqueueApiCall(() => - fetch(process.env.AI_API_ENDPOINT + '/v1/chat/completions', { - method: 'POST', - headers: { - 'Content-Type': 'application/json', - 'Authorization': `Bearer ${process.env.AI_API_KEY}` - }, - body: JSON.stringify({ - model: AI_MODEL, - messages: [ - { - role: 'user', - content: systemPrompt - } - ], - max_tokens: 200, - temperature: 0.7 - }) - }), taskId); + console.log(`[ENHANCEMENT] Starting for user ${userId}, input length: ${sanitizedInput.length}`); + + const analyzerConfig = getAnalyzerConfig(); + + let aiContent; + try { + const aiResponse = await enqueueApiCall(() => + callAI(analyzerConfig, [ + { role: 'user', content: systemPrompt } + ], 200, 0.1), taskId); // Lower temperature for consistent JSON - if (!aiResponse.ok) { - console.error('AI enhancement error:', await aiResponse.text()); - return apiServerError.unavailable('Enhancement service unavailable'); - } + aiContent = aiResponse.choices?.[0]?.message?.content; - const aiData = await aiResponse.json(); - const aiContent = aiData.choices?.[0]?.message?.content; + if (!aiContent) { + console.error(`[ENHANCEMENT] No AI response content for task ${taskId}`); + return apiServerError.unavailable('No enhancement response'); + } - if (!aiContent) { - return apiServerError.unavailable('No enhancement response'); + console.log(`[ENHANCEMENT] Received AI response for task ${taskId}, length: ${aiContent.length}`); + + } catch (apiError) { + console.error(`[ENHANCEMENT] AI API call failed for task ${taskId}:`, apiError); + return apiServerError.unavailable('AI service temporarily unavailable'); } let questions; try { - const cleanedContent = aiContent + const cleanedContent = aiContent .replace(/^```json\s*/i, '') .replace(/\s*```\s*$/, '') .trim(); - questions = JSON.parse(cleanedContent); + questions = JSON.parse(cleanedContent); if (!Array.isArray(questions) || questions.length === 0) { - throw new Error('Invalid questions format'); - } - - // Validate and clean questions - questions = questions - .filter(q => typeof q === 'string' && q.length > 5 && q.length < 120) - .slice(0, 3); - - if (questions.length === 0) { - throw new Error('No valid questions found'); + console.log(`[ENHANCEMENT] No questions generated for task ${taskId} - input likely complete`); + questions = []; + } else { + questions = questions + .filter(q => typeof q === 'string' && q.length > 5 && q.length < 120) + .slice(0, 3); } - } catch (error) { - console.error('Failed to parse enhancement response:', aiContent); + } catch (parseError) { + console.error(`[ENHANCEMENT] Failed to parse AI 
response for task ${taskId}:`, parseError); + console.error(`[ENHANCEMENT] Raw AI content:`, aiContent); return apiServerError.unavailable('Invalid enhancement response format'); } - console.log(`[AI Enhancement] User: ${userId}, Questions: ${questions.length}, Input length: ${sanitizedInput.length}`); + console.log(`[ENHANCEMENT] Completed for user ${userId}: ${questions.length} questions, input length: ${sanitizedInput.length}`); return new Response(JSON.stringify({ success: true, questions, - taskId + taskId, + hasQuestions: questions.length > 0 }), { status: 200, headers: { 'Content-Type': 'application/json' } }); } catch (error) { - console.error('Enhancement error:', error); + console.error('[ENHANCEMENT] Unexpected error:', error); return apiServerError.internal('Enhancement processing failed'); } }; \ No newline at end of file diff --git a/src/pages/api/ai/query.ts b/src/pages/api/ai/query.ts index c6ce37e..ee3d449 100644 --- a/src/pages/api/ai/query.ts +++ b/src/pages/api/ai/query.ts @@ -1,29 +1,22 @@ -// src/pages/api/ai/query.ts import type { APIRoute } from 'astro'; import { withAPIAuth } from '../../../utils/auth.js'; import { getCompressedToolsDataForAI } from '../../../utils/dataService.js'; import { apiError, apiServerError, createAuthErrorResponse } from '../../../utils/api.js'; -import { enqueueApiCall } from '../../../utils/rateLimitedQueue.js'; +import { enqueueChainedApiCall } from '../../../utils/rateLimitedQueue.js'; +import { callAI, getSelectorConfig, getAnalyzerConfig } from '../../../utils/aiService.js'; +import { createSelectorPrompt, createWorkflowSystemPrompt, createToolSystemPrompt, createJsonConversionPrompt } from '../../../utils/aiPrompts.js'; +import { isEmbeddingsEnabled, generateToolEmbeddings, findSimilarItems, type ToolEmbedding } from '../../../utils/embeddingsService.js'; export const prerender = false; -function getEnv(key: string): string { - const value = process.env[key]; - if (!value) { - throw new Error(`Missing environment variable: ${key}`); - } - return value; -} - -const AI_MODEL = getEnv('AI_MODEL'); const rateLimitStore = new Map(); const RATE_LIMIT_WINDOW = 60 * 1000; const RATE_LIMIT_MAX = 10; function sanitizeInput(input: string): string { let sanitized = input - .replace(/```[\s\S]*?```/g, '[CODE_BLOCK_REMOVED]') // Remove code blocks - .replace(/\<\/?[^>]+(>|$)/g, '') // Remove HTML tags + .replace(/```[\s\S]*?```/g, '[CODE_BLOCK_REMOVED]') + .replace(/\<\/?[^>]+(>|$)/g, '') .replace(/\b(system|assistant|user)\s*[:]/gi, '[ROLE_REMOVED]') .replace(/\b(ignore|forget|disregard)\s+(previous|all|your)\s+(instructions?|context|rules?)/gi, '[INSTRUCTION_REMOVED]') .trim(); @@ -33,11 +26,34 @@ function sanitizeInput(input: string): string { return sanitized; } -function stripMarkdownJson(content: string): string { - return content +function extractJsonFromResponse(content: string): string { + // First try simple markdown removal + let cleaned = content .replace(/^```json\s*/i, '') - .replace(/\s*```\s*$/, '') + .replace(/\s*```\s*$/i, '') .trim(); + + // If it looks like JSON already, return it + if (cleaned.startsWith('{') && cleaned.endsWith('}')) { + return cleaned; + } + + // Try to find JSON block in the response + const jsonMatch = content.match(/```json\s*(\{[\s\S]*?\})\s*```/i); + if (jsonMatch) { + return jsonMatch[1].trim(); + } + + // Try to find any JSON-like structure + const jsonStart = content.indexOf('{'); + const jsonEnd = content.lastIndexOf('}'); + + if (jsonStart >= 0 && jsonEnd > jsonStart) { + return 
content.substring(jsonStart, jsonEnd + 1); + } + + // If no JSON found, return original (will likely fail parsing) + return cleaned; } function checkRateLimit(userId: string): boolean { @@ -77,301 +93,266 @@ async function loadToolsDatabase() { } } -function createWorkflowSystemPrompt(toolsData: any): string { - const toolsList = toolsData.tools.map((tool: any) => ({ - name: tool.name, - description: tool.description, - domains: tool.domains, - phases: tool.phases, - domainAgnostic: tool['domain-agnostic-software'], - platforms: tool.platforms, - skillLevel: tool.skillLevel, - license: tool.license, - tags: tool.tags, - related_concepts: tool.related_concepts || [] - })); - - const conceptsList = toolsData.concepts.map((concept: any) => ({ - name: concept.name, - description: concept.description, - domains: concept.domains, - phases: concept.phases, - skillLevel: concept.skillLevel, - tags: concept.tags - })); - - const regularPhases = toolsData.phases || []; +function simpleTextBasedSelection(query: string, allItems: any[]): any[] { + const maxCandidates = parseInt(process.env.AI_EMBEDDING_CANDIDATES || '30'); + const queryLower = query.toLowerCase(); + const queryWords = queryLower.split(/\s+/).filter(word => word.length > 2); - const domainAgnosticSoftware = toolsData['domain-agnostic-software'] || []; + console.log(`[FALLBACK] Using text-based selection with ${queryWords.length} query words`); - const allPhaseItems = [ - ...regularPhases, - ...domainAgnosticSoftware - ]; + const scoredItems = allItems.map(item => { + let score = 0; + const searchText = `${item.name} ${item.description} ${(item.tags || []).join(' ')} ${(item.domains || []).join(' ')} ${(item.phases || []).join(' ')}`.toLowerCase(); + + // Exact name match gets highest score + if (item.name.toLowerCase().includes(queryLower)) { + score += 100; + } + + // Description match + if (item.description.toLowerCase().includes(queryLower)) { + score += 50; + } + + // Word matches + queryWords.forEach(word => { + if (searchText.includes(word)) { + score += 10; + } + }); + + // Tag exact matches get bonus + (item.tags || []).forEach((tag: string) => { + if (queryLower.includes(tag.toLowerCase()) || tag.toLowerCase().includes(queryLower)) { + score += 25; + } + }); + + return { item, score }; + }); - const phasesDescription = allPhaseItems.map((phase: any) => - `- ${phase.id}: ${phase.name}` - ).join('\n'); - - const domainsDescription = toolsData.domains.map((domain: any) => - `- ${domain.id}: ${domain.name}` - ).join('\n'); - - const phaseDescriptions = regularPhases.map((phase: any) => - `- ${phase.name}: ${phase.description || 'Tools/Methods for this phase'}` - ).join('\n'); - - const domainAgnosticDescriptions = domainAgnosticSoftware.map((section: any) => - `- ${section.name}: ${section.description || 'Cross-cutting software and platforms'}` - ).join('\n'); - - const validPhases = [ - ...regularPhases.map((p: any) => p.id), - ...domainAgnosticSoftware.map((s: any) => s.id) - ].join('|'); - - return `Du bist ein DFIR (Digital Forensics and Incident Response) Experte, der Ermittlern bei der Auswahl von Software und Methoden hilft. - -VERFÜGBARE TOOLS/METHODEN: -${JSON.stringify(toolsList, null, 2)} - -VERFÜGBARE HINTERGRUNDWISSEN-KONZEPTE: -${JSON.stringify(conceptsList, null, 2)} - -UNTERSUCHUNGSPHASEN (NIST Framework): -${phasesDescription} - -FORENSISCHE DOMÄNEN: -${domainsDescription} - -WICHTIGE REGELN: -1. Pro Phase 2-3 Tools/Methoden empfehlen (immer mindestens 2 wenn verfügbar) -2. 
Tools/Methoden können in MEHREREN Phasen empfohlen werden wenn sinnvoll - versuche ein Tool/Methode für jede Phase zu empfehlen, selbst wenn die Priorität "low" ist. -3. Für Reporting-Phase: Visualisierungs- und Dokumentationssoftware einschließen -4. Gib stets dem spezieller für den Fall geeigneten Werkzeug den Vorzug. -5. Deutsche Antworten für deutsche Anfragen, English for English queries -6. Methoden haben, sofern für das SZENARIO passend, IMMER Vorrang vor Software. -7. Bevorzuge alles, was nicht proprietär ist (license != "Proprietary"), aber erkenne an, wenn proprietäre Software besser geeignet ist. -8. WICHTIG: Erwähne relevante Hintergrundwissen-Konzepte wenn Tools verwendet werden, die related_concepts haben -9. Konzepte sind NICHT Tools - empfehle sie nicht als actionable Schritte, sondern als Wissensbasis - -ENHANCED CONTEXTUAL ANALYSIS: -10. Analysiere das Szenario detailliert und identifiziere Schlüsselelemente, Bedrohungen und forensische Herausforderungen -11. Entwickle einen strategischen Untersuchungsansatz basierend auf dem spezifischen Szenario -12. Identifiziere zeitkritische oder besonders wichtige Faktoren für diesen Fall - -SOFTWARE/METHODEN-AUSWAHL NACH PHASE: -${phaseDescriptions} - -DOMÄNENAGNOSTISCHE SOFTWARE/METHODEN: -${domainAgnosticDescriptions} - -ANTWORT-FORMAT (strict JSON): -{ - "scenario_analysis": "Detaillierte Analyse des Szenarios: Erkannte Schlüsselelemente, Art des Vorfalls, betroffene Systeme, potentielle Bedrohungen und forensische Herausforderungen", - "investigation_approach": "Strategischer Untersuchungsansatz für dieses spezifische Szenario: Prioritäten, Reihenfolge der Phasen, besondere Überlegungen", - "critical_considerations": "Zeitkritische Faktoren, wichtige Sicherheitsaspekte oder besondere Vorsichtsmaßnahmen für diesen Fall", - "recommended_tools": [ - { - "name": "EXAKTER Name aus der Tools-Database", - "priority": "high|medium|low", - "phase": "${validPhases}", - "justification": "Warum diese Methode für diese Phase und dieses spezifische Szenario geeignet ist - mit Bezug zu den erkannten Schlüsselelementen" - } - ], - "workflow_suggestion": "Vorgeschlagener Untersuchungsablauf mit konkreten Schritten für dieses Szenario", - "background_knowledge": [ - { - "concept_name": "EXAKTER Name aus der Konzepte-Database", - "relevance": "Warum dieses Konzept für das Szenario relevant ist, und bei welchen der empfohlenen Methoden/Tools." - } - ], - "additional_notes": "Wichtige Überlegungen und Hinweise" + const selected = scoredItems + .filter(({ score }) => score > 0) + .sort((a, b) => b.score - a.score) + .slice(0, maxCandidates) + .map(({ item }) => item); + + console.log(`[FALLBACK] Selected ${selected.length} items from ${allItems.length} total`); + return selected; } -Antworte NUR mit validen JSON. 
Keine zusätzlichen Erklärungen außerhalb des JSON.`; -} - -function createToolSystemPrompt(toolsData: any): string { - const toolsList = toolsData.tools.map((tool: any) => ({ - name: tool.name, - description: tool.description, - domains: tool.domains, - phases: tool.phases, - platforms: tool.platforms, - skillLevel: tool.skillLevel, - license: tool.license, - tags: tool.tags, - url: tool.url, - projectUrl: tool.projectUrl, - related_concepts: tool.related_concepts || [] - })); - - const conceptsList = toolsData.concepts.map((concept: any) => ({ - name: concept.name, - description: concept.description, - domains: concept.domains, - phases: concept.phases, - skillLevel: concept.skillLevel, - tags: concept.tags - })); - - return `Du bist ein DFIR (Digital Forensics and Incident Response) Experte, der bei der Auswahl spezifischer Software/Methoden für konkrete Probleme hilft. - -VERFÜGBARE TOOLS/METHODEN: -${JSON.stringify(toolsList, null, 2)} - -VERFÜGBARE HINTERGRUNDWISSEN-KONZEPTE: -${JSON.stringify(conceptsList, null, 2)} - -WICHTIGE REGELN: -1. Analysiere das spezifische Problem/die Anforderung sorgfältig -2. Empfehle 1-3 Methoden/Tools, sortiert nach Eignung (beste Empfehlung zuerst) -3. Gib detaillierte Erklärungen, WARUM und WIE jede Methode/Tool das Problem löst -4. Berücksichtige praktische Aspekte: Skill Level, Plattformen, Verfügbarkeit -5. Deutsche Antworten für deutsche Anfragen, English for English queries -6. Gib konkrete Anwendungshinweise, nicht nur allgemeine Beschreibungen - Methoden haben, sofern für das SZENARIO passend, IMMER Vorrang vor Software. -7. Erwähne sowohl Stärken als auch Schwächen/Limitationen -8. Schlage alternative Ansätze vor, wenn sinnvoll -9. Gib grundsätzliche Hinweise, WIE die Methode/Tool konkret eingesetzt wird -10. WICHTIG: Erwähne relevante Hintergrundwissen-Konzepte wenn Tools verwendet werden, die related_concepts haben -11. Konzepte sind NICHT Tools - empfehle sie nicht als actionable Schritte, sondern als Wissensbasis - -ENHANCED CONTEXTUAL ANALYSIS: -12. Analysiere das Problem detailliert und identifiziere technische Anforderungen, Herausforderungen und Erfolgsfaktoren -13. Entwickle einen strategischen Lösungsansatz basierend auf dem spezifischen Problem -14. 
Identifiziere wichtige Voraussetzungen oder Warnungen für die Anwendung - -ANTWORT-FORMAT (strict JSON): -{ - "problem_analysis": "Detaillierte Analyse des Problems: Erkannte technische Anforderungen, Herausforderungen, benötigte Fähigkeiten und Erfolgsfaktoren", - "investigation_approach": "Strategischer Lösungsansatz für dieses spezifische Problem: Herangehensweise, Prioritäten, optimale Anwendungsreihenfolge", - "critical_considerations": "Wichtige Voraussetzungen, potentielle Fallstricke oder Warnungen für die Anwendung der empfohlenen Lösungen", - "recommended_tools": [ - { - "name": "EXAKTER Name aus der Tools-Database", - "rank": 1, - "suitability_score": "high|medium|low", - "detailed_explanation": "Detaillierte Erklärung, warum dieses Tool/diese Methode das spezifische Problem löst - mit Bezug zu den erkannten Anforderungen", - "implementation_approach": "Konkrete Schritte/Ansatz zur Anwendung für dieses spezifische Problem", - "pros": ["Spezifische Vorteile für diesen Anwendungsfall", "Weitere Vorteile"], - "cons": ["Potentielle Nachteile oder Limitationen", "Weitere Einschränkungen"], - "alternatives": "Alternative Ansätze oder ergänzende Tools/Methoden, falls relevant" +async function selectRelevantItemsWithEmbeddings(query: string, mode: string) { + const fullToolsData = await loadToolsDatabase(); + let candidates; + let embeddingCandidates = 0; + let selectionMethod = 'text-based'; + + const allItems = [...fullToolsData.tools, ...fullToolsData.concepts]; + + if (isEmbeddingsEnabled()) { + try { + console.log(`[SELECTION] Attempting embeddings-based selection for ${allItems.length} items`); + const toolEmbeddings = await generateToolEmbeddings(fullToolsData); + const similarItems = await findSimilarItems(query, toolEmbeddings); + candidates = similarItems.map(item => item.tool); + embeddingCandidates = candidates.length; + selectionMethod = 'embeddings'; + console.log(`[SELECTION] Embeddings selection successful: ${candidates.length} candidates`); + } catch (error) { + console.warn('[SELECTION] Embeddings failed, using text-based fallback:', error.message); + candidates = simpleTextBasedSelection(query, allItems); + selectionMethod = 'text-fallback'; } - ], - "background_knowledge": [ - { - "concept_name": "EXAKTER Name aus der Konzepte-Database", - "relevance": "Warum dieses Konzept für die empfohlenen Tools/das Problem relevant ist, und für welche der empfohlenen Methoden/Tools." - } - ], - "additional_considerations": "Wichtige Überlegungen, Voraussetzungen oder Warnungen" -} + } else { + console.log('[SELECTION] Embeddings disabled, using text-based selection'); + candidates = simpleTextBasedSelection(query, allItems); + } -Antworte NUR mit validen JSON. 
Keine zusätzlichen Erklärungen außerhalb des JSON.`; -} + // Safety check - ensure we have some candidates + if (candidates.length === 0) { + console.warn('[SELECTION] No candidates found, using top items from full dataset'); + candidates = allItems.slice(0, parseInt(process.env.AI_EMBEDDING_CANDIDATES || '30')); + selectionMethod = 'emergency-fallback'; + } -export const POST: APIRoute = async ({ request }) => { + console.log(`[SELECTION] Using ${selectionMethod} selection: ${candidates.length} candidates for AI selector`); + + const selectorConfig = getSelectorConfig(); + try { - const authResult = await withAPIAuth(request, 'ai'); - if (!authResult.authenticated) { - return createAuthErrorResponse(); - } + const prompt = createSelectorPrompt(candidates, query, mode); - const userId = authResult.userId; + console.log(`[SELECTION] Sending ${candidates.length} candidates to AI selector (prompt length: ${prompt.length})`); + + const response = await callAI(selectorConfig, [ + { role: 'user', content: prompt } + ], 1500, 0.1); // Lower temperature for consistent JSON - if (!checkRateLimit(userId)) { - return apiError.rateLimit('Rate limit exceeded'); + const content = response.choices?.[0]?.message?.content; + if (!content) { + console.error('[SELECTION] AI response structure:', JSON.stringify(response, null, 2)); + throw new Error('No selection response from AI'); } - const body = await request.json(); - const { query, mode = 'workflow', taskId: clientTaskId } = body; + console.log(`[SELECTION] AI response received, length: ${content.length}`); + console.log(`[SELECTION] AI response preview:`, content.slice(0, 200) + '...'); - // ADD THIS DEBUG LOGGING - console.log(`[AI API] Received request - TaskId: ${clientTaskId}, Mode: ${mode}, Query length: ${query?.length || 0}`); - - if (!query || typeof query !== 'string') { - console.log(`[AI API] Invalid query for task ${clientTaskId}`); - return apiError.badRequest('Query required'); + let selection; + try { + const cleanedContent = extractJsonFromResponse(content); + console.log(`[SELECTION] Extracted JSON preview:`, cleanedContent.slice(0, 200) + '...'); + selection = JSON.parse(cleanedContent); + } catch (parseError) { + console.error('[SELECTION] JSON parsing failed:', parseError); + console.error('[SELECTION] Raw AI content:', content); + console.error('[SELECTION] Cleaned content:', extractJsonFromResponse(content)); + throw new Error(`JSON parsing failed: ${parseError.message}`); } - - if (!['workflow', 'tool'].includes(mode)) { - console.log(`[AI API] Invalid mode for task ${clientTaskId}: ${mode}`); - return apiError.badRequest('Invalid mode. Must be "workflow" or "tool"'); - } - - const sanitizedQuery = sanitizeInput(query); - if (sanitizedQuery.includes('[FILTERED]')) { - console.log(`[AI API] Filtered input detected for task ${clientTaskId}`); - return apiError.badRequest('Invalid input detected'); - } - - const toolsData = await loadToolsDatabase(); - - const systemPrompt = mode === 'workflow' - ? 
createWorkflowSystemPrompt(toolsData) - : createToolSystemPrompt(toolsData); - const taskId = clientTaskId || `ai_${userId}_${Date.now()}_${Math.random().toString(36).substr(2, 6)}`; - - console.log(`[AI API] About to enqueue task ${taskId}`); - - - const aiResponse = await enqueueApiCall(() => - fetch(process.env.AI_API_ENDPOINT + '/v1/chat/completions', { - method: 'POST', - headers: { - 'Content-Type': 'application/json', - 'Authorization': `Bearer ${process.env.AI_API_KEY}` - }, - body: JSON.stringify({ - model: AI_MODEL, - messages: [ - { - role: 'system', - content: systemPrompt - }, - { - role: 'user', - content: sanitizedQuery + const selectedTools = candidates.filter(item => + item.type !== 'concept' && (selection.selected_tools || []).includes(item.name) + ); + const selectedConcepts = candidates.filter(item => + item.type === 'concept' && (selection.selected_concepts || []).includes(item.name) + ); + + console.log(`[SELECTION] Final selection: ${selectedTools.length} tools, ${selectedConcepts.length} concepts from ${candidates.length} candidates`); + + // Ensure we have at least some tools selected + if (selectedTools.length === 0 && selectedConcepts.length === 0) { + console.warn('[SELECTION] No items selected by AI, using fallback selection'); + const fallbackTools = candidates.filter(item => item.type !== 'concept').slice(0, 10); + const fallbackConcepts = candidates.filter(item => item.type === 'concept').slice(0, 3); + return { + selectedItems: { + tools: fallbackTools, + concepts: fallbackConcepts, + domains: fullToolsData.domains, + phases: fullToolsData.phases, + ...Object.keys(fullToolsData).reduce((acc, key) => { + if (!['tools', 'concepts', 'domains', 'phases'].includes(key)) { + acc[key] = fullToolsData[key]; } - ], - max_tokens: 3500, - temperature: 0.3 - }) - }) - , taskId); - - if (!aiResponse.ok) { - console.error('AI API error:', await aiResponse.text()); - return apiServerError.unavailable('AI service unavailable'); + return acc; + }, {} as any) + }, + reasoning: 'Fallback selection used due to AI selection failure', + candidateCount: candidates.length, + embeddingCandidates, + selectionMethod: selectionMethod + '-fallback' + }; } - const aiData = await aiResponse.json(); - const aiContent = aiData.choices?.[0]?.message?.content; + return { + selectedItems: { + tools: selectedTools, + concepts: selectedConcepts, + domains: fullToolsData.domains, + phases: fullToolsData.phases, + ...Object.keys(fullToolsData).reduce((acc, key) => { + if (!['tools', 'concepts', 'domains', 'phases'].includes(key)) { + acc[key] = fullToolsData[key]; + } + return acc; + }, {} as any) + }, + reasoning: selection.reasoning, + candidateCount: candidates.length, + embeddingCandidates, + selectionMethod + }; + } catch (error) { + console.error('[SELECTION] AI selector failed:', error); + console.error('[SELECTION] Selector model:', selectorConfig.model); + console.error('[SELECTION] Query length:', query.length); + console.error('[SELECTION] Candidate count:', candidates.length); + throw new Error(`Selection failed: ${error.message}`); + } +} - if (!aiContent) { - return apiServerError.unavailable('No response from AI'); +async function analyzeWithSelectedItems(selectionResult: any, query: string, mode: string) { + const analyzerConfig = getAnalyzerConfig(); + const prompt = mode === 'workflow' + ? 
createWorkflowSystemPrompt(selectionResult.selectedItems) + : createToolSystemPrompt(selectionResult.selectedItems); + + console.log(`[ANALYSIS] Starting ${mode} analysis with ${selectionResult.selectedItems.tools.length} tools and ${selectionResult.selectedItems.concepts.length} concepts`); + console.log(`[ANALYSIS] Using model: ${analyzerConfig.model}`); + console.log(`[ANALYSIS] System prompt length: ${prompt.length}`); + + try { + const response = await callAI(analyzerConfig, [ + { role: 'system', content: prompt }, + { role: 'user', content: query } + ], 3500, 0.1); // Lower temperature for more consistent JSON output + + const content = response.choices?.[0]?.message?.content; + if (!content) { + console.error('[ANALYSIS] No content in AI response:', JSON.stringify(response, null, 2)); + throw new Error('No analysis response from AI'); } + console.log(`[ANALYSIS] Received AI response, length: ${content.length}`); + console.log(`[ANALYSIS] Response preview:`, content.slice(0, 200) + '...'); + let recommendation; try { - const cleanedContent = stripMarkdownJson(aiContent); + const cleanedContent = extractJsonFromResponse(content); + console.log(`[ANALYSIS] Extracted JSON preview:`, cleanedContent.slice(0, 200) + '...'); recommendation = JSON.parse(cleanedContent); - } catch (error) { - console.error('Failed to parse AI response:', aiContent); - return apiServerError.unavailable('Invalid AI response format'); + } catch (parseError) { + console.warn('[ANALYSIS] JSON parsing failed, attempting prose-to-JSON conversion...'); + + // Check if response looks like prose (doesn't start with {) + const trimmedContent = content.trim(); + if (!trimmedContent.startsWith('{')) { + console.log('[ANALYSIS] Response is prose, converting to JSON...'); + + try { + // Use a simpler model for conversion to save costs + const conversionConfig = getSelectorConfig(); + const conversionPrompt = createJsonConversionPrompt(content, query, mode); + + console.log(`[ANALYSIS] Sending prose conversion request (length: ${conversionPrompt.length})`); + + const conversionResponse = await callAI(conversionConfig, [ + { role: 'user', content: conversionPrompt } + ], 2000, 0.1); // Lower temperature for more consistent JSON + + const convertedContent = conversionResponse.choices?.[0]?.message?.content; + if (!convertedContent) { + throw new Error('No conversion response'); + } + + console.log(`[ANALYSIS] Conversion response length: ${convertedContent.length}`); + console.log(`[ANALYSIS] Conversion preview:`, convertedContent.slice(0, 200) + '...'); + + const finalJsonContent = extractJsonFromResponse(convertedContent); + recommendation = JSON.parse(finalJsonContent); + + console.log('[ANALYSIS] ✅ Successfully converted prose to JSON'); + + } catch (conversionError) { + console.error('[ANALYSIS] Prose-to-JSON conversion failed:', conversionError); + console.error('[ANALYSIS] Original prose response:', content); + throw new Error(`Both direct JSON parsing and prose conversion failed: ${parseError.message}`); + } + } else { + console.error('[ANALYSIS] Response looks like JSON but parsing failed:', parseError); + console.error('[ANALYSIS] Raw content:', content); + console.error('[ANALYSIS] Cleaned content:', extractJsonFromResponse(content)); + throw new Error(`JSON parsing failed: ${parseError.message}`); + } } - const validToolNames = new Set(toolsData.tools.map((t: any) => t.name)); - const validConceptNames = new Set(toolsData.concepts.map((c: any) => c.name)); + const validToolNames = new 
Set(selectionResult.selectedItems.tools.map((t: any) => t.name)); + const validConceptNames = new Set(selectionResult.selectedItems.concepts.map((c: any) => c.name)); let validatedRecommendation; if (mode === 'workflow') { validatedRecommendation = { ...recommendation, - // Ensure all new fields are included with fallbacks scenario_analysis: recommendation.scenario_analysis || recommendation.problem_analysis || '', investigation_approach: recommendation.investigation_approach || '', critical_considerations: recommendation.critical_considerations || '', @@ -393,7 +374,6 @@ export const POST: APIRoute = async ({ request }) => { } else { validatedRecommendation = { ...recommendation, - // Ensure all new fields are included with fallbacks problem_analysis: recommendation.problem_analysis || recommendation.scenario_analysis || '', investigation_approach: recommendation.investigation_approach || '', critical_considerations: recommendation.critical_considerations || '', @@ -420,14 +400,71 @@ export const POST: APIRoute = async ({ request }) => { }; } - console.log(`[AI Query] Mode: ${mode}, User: ${userId}, Query length: ${sanitizedQuery.length}, Tools: ${validatedRecommendation.recommended_tools.length}, Concepts: ${validatedRecommendation.background_knowledge?.length || 0}`); + console.log(`[ANALYSIS] Completed successfully: ${validatedRecommendation.recommended_tools.length} final recommendations`); + return validatedRecommendation; + } catch (error) { + console.error('[ANALYSIS] Failed:', error); + throw new Error(`Analysis failed: ${error.message}`); + } +} + +export const POST: APIRoute = async ({ request }) => { + try { + const authResult = await withAPIAuth(request, 'ai'); + if (!authResult.authenticated) { + return createAuthErrorResponse(); + } + + const userId = authResult.userId; + + if (!checkRateLimit(userId)) { + return apiError.rateLimit('Rate limit exceeded'); + } + + const body = await request.json(); + const { query, mode = 'workflow', taskId: clientTaskId } = body; + + console.log(`[AI API] Received request - TaskId: ${clientTaskId}, Mode: ${mode}, Query length: ${query?.length || 0}`); + + if (!query || typeof query !== 'string') { + console.log(`[AI API] Invalid query for task ${clientTaskId}`); + return apiError.badRequest('Query required'); + } + + if (!['workflow', 'tool'].includes(mode)) { + console.log(`[AI API] Invalid mode for task ${clientTaskId}: ${mode}`); + return apiError.badRequest('Invalid mode. 
Must be "workflow" or "tool"'); + } + + const sanitizedQuery = sanitizeInput(query); + if (sanitizedQuery.includes('[FILTERED]')) { + console.log(`[AI API] Filtered input detected for task ${clientTaskId}`); + return apiError.badRequest('Invalid input detected'); + } + + const taskId = clientTaskId || `ai_${userId}_${Date.now()}_${Math.random().toString(36).substr(2, 6)}`; + + console.log(`[AI API] Starting AI processing for task ${taskId}`); + + const result = await enqueueChainedApiCall( + async () => selectRelevantItemsWithEmbeddings(sanitizedQuery, mode), + (selectionResult: any) => async () => analyzeWithSelectedItems(selectionResult, sanitizedQuery, mode), + taskId + ); + + console.log(`[AI Query] Success - Mode: ${mode}, User: ${userId}, Method: ${result.stage1Result.selectionMethod}, Tools: ${result.finalResult.recommended_tools.length}, Concepts: ${result.finalResult.background_knowledge?.length || 0}`); return new Response(JSON.stringify({ success: true, mode, taskId, - recommendation: validatedRecommendation, - query: sanitizedQuery + recommendation: result.finalResult, + query: sanitizedQuery, + selectedItems: result.stage1Result.candidateCount, + embeddingCandidates: result.stage1Result.embeddingCandidates, + selectionMethod: result.stage1Result.selectionMethod, + selectionReasoning: result.stage1Result.reasoning, + embeddingsEnabled: isEmbeddingsEnabled() }), { status: 200, headers: { 'Content-Type': 'application/json' } diff --git a/src/utils/aiPrompts.ts b/src/utils/aiPrompts.ts new file mode 100644 index 0000000..edbaee8 --- /dev/null +++ b/src/utils/aiPrompts.ts @@ -0,0 +1,221 @@ +export function createSelectorPrompt(candidateItems: any[], query: string, mode: string): string { + const maxItems = parseInt(process.env.AI_MAX_SELECTED_ITEMS || '15'); + + // Create a simpler representation of items for selection + const simplifiedItems = candidateItems.map(item => ({ + name: item.name, + type: item.type, + description: item.description?.slice(0, 150) + (item.description?.length > 150 ? '...' : ''), + tags: (item.tags || []).slice(0, 5), + domains: item.domains || [], + phases: item.phases || [] + })); + + return `RESPOND ONLY IN JSON FORMAT. NO EXPLANATIONS. NO MARKDOWN. ONLY JSON. + +You are a DFIR expert selecting relevant tools and concepts. + +QUERY: "${query}" +MODE: ${mode} + +From these ${candidateItems.length} candidates, select the ${maxItems} most relevant: + +${JSON.stringify(simplifiedItems, null, 2)} + +OUTPUT FORMAT (COPY EXACTLY): +{"selected_tools":["name1","name2"],"selected_concepts":["concept1"],"reasoning":"brief explanation"} + +CRITICAL: Output ONLY the JSON object above. 
No other text.`; +} + +export function createWorkflowSystemPrompt(selectedData: any): string { + const toolsList = selectedData.tools.map((tool: any) => ({ + name: tool.name, + description: tool.description?.slice(0, 200), + domains: tool.domains, + phases: tool.phases, + platforms: tool.platforms, + skillLevel: tool.skillLevel, + license: tool.license, + tags: tool.tags?.slice(0, 5), + related_concepts: tool.related_concepts || [] + })); + + const conceptsList = selectedData.concepts.map((concept: any) => ({ + name: concept.name, + description: concept.description?.slice(0, 200), + domains: concept.domains, + phases: concept.phases, + skillLevel: concept.skillLevel, + tags: concept.tags?.slice(0, 5) + })); + + const validPhases = [ + ...selectedData.phases.map((p: any) => p.id), + ...Object.keys(selectedData).filter(key => + !['tools', 'concepts', 'domains', 'phases'].includes(key) + ).map(key => selectedData[key]).flat().filter(Boolean).map((s: any) => s.id) + ].join('|'); + + return `RESPOND ONLY IN VALID JSON FORMAT. NO EXPLANATIONS BEFORE OR AFTER JSON. + +You are a DFIR expert providing workflow recommendations. + +AVAILABLE TOOLS: ${JSON.stringify(toolsList)} +AVAILABLE CONCEPTS: ${JSON.stringify(conceptsList)} + +RULES: +- Recommend 2-3 tools per phase +- Use exact tool names from the database +- Include relevant concepts for background knowledge +- German responses for German queries + +REQUIRED OUTPUT FORMAT: +{ + "scenario_analysis": "Analysis text in German", + "investigation_approach": "Approach text in German", + "critical_considerations": "Considerations text in German", + "recommended_tools": [ + { + "name": "EXACT_TOOL_NAME", + "priority": "high|medium|low", + "phase": "${validPhases}", + "justification": "Why this tool fits" + } + ], + "workflow_suggestion": "Workflow text in German", + "background_knowledge": [ + { + "concept_name": "EXACT_CONCEPT_NAME", + "relevance": "Why relevant" + } + ], + "additional_notes": "Important notes" +} + +CRITICAL: Output ONLY the JSON object. No markdown. No explanations outside JSON.`; +} + +export function createToolSystemPrompt(selectedData: any): string { + const toolsList = selectedData.tools.map((tool: any) => ({ + name: tool.name, + description: tool.description?.slice(0, 200), + domains: tool.domains, + phases: tool.phases, + platforms: tool.platforms, + skillLevel: tool.skillLevel, + license: tool.license, + tags: tool.tags?.slice(0, 5), + related_concepts: tool.related_concepts || [] + })); + + const conceptsList = selectedData.concepts.map((concept: any) => ({ + name: concept.name, + description: concept.description?.slice(0, 200), + domains: concept.domains, + phases: concept.phases, + skillLevel: concept.skillLevel, + tags: concept.tags?.slice(0, 5) + })); + + return `RESPOND ONLY IN VALID JSON FORMAT. NO EXPLANATIONS BEFORE OR AFTER JSON. + +You are a DFIR expert providing specific tool recommendations. 
+ +AVAILABLE TOOLS: ${JSON.stringify(toolsList)} +AVAILABLE CONCEPTS: ${JSON.stringify(conceptsList)} + +RULES: +- Recommend 1-3 tools ranked by suitability +- Use exact tool names from the database +- German responses for German queries + +REQUIRED OUTPUT FORMAT: +{ + "problem_analysis": "Problem analysis in German", + "investigation_approach": "Solution approach in German", + "critical_considerations": "Important prerequisites in German", + "recommended_tools": [ + { + "name": "EXACT_TOOL_NAME", + "rank": 1, + "suitability_score": "high|medium|low", + "detailed_explanation": "Why this tool solves the problem", + "implementation_approach": "How to apply it", + "pros": ["advantage1", "advantage2"], + "cons": ["limitation1", "limitation2"], + "alternatives": "Alternative approaches" + } + ], + "background_knowledge": [ + { + "concept_name": "EXACT_CONCEPT_NAME", + "relevance": "Why relevant for this problem" + } + ], + "additional_considerations": "Important considerations" +} + +CRITICAL: Output ONLY the JSON object. No markdown. No explanations outside JSON.`; +} + +export function createJsonConversionPrompt(proseResponse: string, originalQuery: string, mode: string): string { + return `Convert this prose response to JSON format. + +ORIGINAL QUERY: "${originalQuery}" +MODE: ${mode} + +PROSE RESPONSE TO CONVERT: +${proseResponse} + +OUTPUT REQUIRED FORMAT FOR ${mode.toUpperCase()}: +${mode === 'workflow' ? `{ + "scenario_analysis": "extracted analysis text", + "investigation_approach": "extracted approach text", + "critical_considerations": "extracted considerations", + "recommended_tools": [ + { + "name": "tool name from response", + "priority": "high|medium|low", + "phase": "phase_id", + "justification": "extracted reasoning" + } + ], + "workflow_suggestion": "extracted workflow", + "background_knowledge": [], + "additional_notes": "extracted notes" +}` : `{ + "problem_analysis": "extracted analysis", + "investigation_approach": "extracted approach", + "critical_considerations": "extracted considerations", + "recommended_tools": [ + { + "name": "tool name", + "rank": 1, + "suitability_score": "high|medium|low", + "detailed_explanation": "extracted explanation", + "implementation_approach": "extracted approach", + "pros": ["extracted pros"], + "cons": ["extracted cons"], + "alternatives": "extracted alternatives" + } + ], + "background_knowledge": [], + "additional_considerations": "extracted considerations" +}`} + +CRITICAL: Extract the information from the prose and format as JSON. Output ONLY the JSON object.`; +} + +export function createEnhancementPrompt(input: string): string { + return `Analyze this forensic scenario input and provide questions if incomplete. + +If incomplete: return JSON array of 1-3 questions +If complete: return empty array [] + +INPUT: ${input} + +FORMAT: ["question1?", "question2?"] or [] + +CRITICAL: Output ONLY the JSON array.`; +} \ No newline at end of file diff --git a/src/utils/aiService.ts b/src/utils/aiService.ts new file mode 100644 index 0000000..b00411b --- /dev/null +++ b/src/utils/aiService.ts @@ -0,0 +1,106 @@ +interface AIConfig { + model: string; + endpoint: string; + apiKey: string; +} + +function getSelectorConfig(): AIConfig { + return { + model: process.env.AI_SELECTOR_MODEL || process.env.AI_MODEL || 'claude-sonnet-4-20250514', + endpoint: (process.env.AI_SELECTOR_ENDPOINT || process.env.AI_API_ENDPOINT!) + '/v1/messages', + apiKey: process.env.AI_SELECTOR_API_KEY || process.env.AI_API_KEY! 
+ }; +} + +function getAnalyzerConfig(): AIConfig { + return { + model: process.env.AI_ANALYZER_MODEL || process.env.AI_MODEL || 'claude-sonnet-4-20250514', + endpoint: (process.env.AI_ANALYZER_ENDPOINT || process.env.AI_API_ENDPOINT!) + '/v1/messages', + apiKey: process.env.AI_ANALYZER_API_KEY || process.env.AI_API_KEY! + }; +} + +export async function callAI(config: AIConfig, messages: any[], maxTokens: number = 1000, temperature: number = 0.3) { + const requestBody = { + model: config.model, + max_tokens: maxTokens, + temperature, + messages + }; + + console.log(`[AI API] Calling ${config.model} with ${messages.length} messages, max_tokens: ${maxTokens}`); + + try { + const response = await fetch(config.endpoint, { + method: "POST", + headers: { + "Content-Type": "application/json", + "Authorization": `Bearer ${config.apiKey}` + }, + body: JSON.stringify(requestBody) + }); + + if (!response.ok) { + let errorDetails = `${response.status} ${response.statusText}`; + try { + const errorBody = await response.text(); + console.error(`[AI API] Error response body:`, errorBody); + errorDetails += ` - ${errorBody}`; + } catch { + console.error(`[AI API] Could not read error response body`); + } + + console.error(`[AI API] Request failed:`, { + endpoint: config.endpoint, + model: config.model, + messageCount: messages.length, + maxTokens, + status: response.status, + hasApiKey: !!config.apiKey + }); + + throw new Error(`AI API error: ${response.status} - ${response.statusText}`); + } + + const result = await response.json(); + + // Handle different API response formats + let content: string | null = null; + + // Mistral API format + if (result.content && Array.isArray(result.content) && result.content[0]?.text) { + content = result.content[0].text; + console.log(`[AI API] Success (Mistral format) - Response length: ${content.length} chars`); + return { + choices: [{ + message: { + content: content + } + }] + }; + } + + // Anthropic/OpenAI format + if (result.choices && result.choices[0] && result.choices[0].message) { + content = result.choices[0].message.content; + console.log(`[AI API] Success (OpenAI/Anthropic format) - Response length: ${content?.length || 0} chars`); + return result; + } + + // If neither format matches, log the structure and fail + console.error(`[AI API] Unexpected response structure:`, JSON.stringify(result, null, 2)); + throw new Error('Unexpected AI API response structure'); + + } catch (error) { + if (error.message?.includes('AI API error:')) { + // Re-throw API errors as-is + throw error; + } else { + // Network or other errors + console.error(`[AI API] Network/request error:`, error); + throw new Error(`AI API request failed: ${error.message}`); + } + } +} + +export { getSelectorConfig, getAnalyzerConfig }; \ No newline at end of file diff --git a/src/utils/embeddingsService.ts b/src/utils/embeddingsService.ts new file mode 100644 index 0000000..8940454 --- /dev/null +++ b/src/utils/embeddingsService.ts @@ -0,0 +1,215 @@ +interface EmbeddingConfig { + endpoint: string; + apiKey: string; + model: string; +} + +export interface ToolEmbedding { + id: string; + name: string; + type: 'tool' | 'concept'; + embedding: number[]; + content: string; + tool: any; + similarity?: number; +} + +function getEmbeddingConfig(): EmbeddingConfig { + return { + endpoint: process.env.AI_EMBEDDINGS_ENDPOINT || 'https://api.mistral.ai/v1/embeddings', + apiKey: process.env.AI_EMBEDDINGS_API_KEY!, + model: process.env.AI_EMBEDDINGS_MODEL || 'mistral-embed' + }; +} + +export function 
isEmbeddingsEnabled(): boolean { + return process.env.AI_EMBEDDINGS_ENABLED === 'true'; +} + +export async function generateEmbedding(text: string): Promise { + const config = getEmbeddingConfig(); + + const response = await fetch(config.endpoint, { + method: 'POST', + headers: { + 'Content-Type': 'application/json', + 'Authorization': `Bearer ${config.apiKey}` + }, + body: JSON.stringify({ + model: config.model, + input: [text] + }) + }); + + if (!response.ok) { + let errorDetails = `${response.status} ${response.statusText}`; + try { + const errorBody = await response.text(); + errorDetails += ` - ${errorBody}`; + } catch { + // If we can't read the error body, use basic error info + } + console.error('Embeddings API error details:', errorDetails); + throw new Error(`Embeddings API error: ${response.status}`); + } + + const data = await response.json(); + return data.data[0].embedding; +} + +export async function generateBatchEmbeddings(texts: string[]): Promise { + const config = getEmbeddingConfig(); + const batchSize = parseInt(process.env.AI_EMBEDDINGS_BATCH_SIZE || '20'); + const delay = parseInt(process.env.AI_EMBEDDINGS_BATCH_DELAY_MS || '1000'); + + console.log(`[EMBEDDINGS] Processing ${texts.length} items in batches of ${batchSize}`); + + const results: number[][] = []; + + for (let i = 0; i < texts.length; i += batchSize) { + const batch = texts.slice(i, i + batchSize); + const batchNum = Math.floor(i/batchSize) + 1; + const totalBatches = Math.ceil(texts.length/batchSize); + + console.log(`[EMBEDDINGS] Processing batch ${batchNum}/${totalBatches} (${batch.length} items)`); + + // Log batch content lengths for debugging + const batchLengths = batch.map(text => text.length); + const batchTotalLength = batchLengths.reduce((a, b) => a + b, 0); + console.log(`[EMBEDDINGS] Batch ${batchNum} total chars: ${batchTotalLength}, avg per item: ${Math.round(batchTotalLength / batch.length)}`); + + try { + const response = await fetch(config.endpoint, { + method: 'POST', + headers: { + 'Content-Type': 'application/json', + 'Authorization': `Bearer ${config.apiKey}` + }, + body: JSON.stringify({ + model: config.model, + input: batch + }) + }); + + if (!response.ok) { + let errorDetails = `${response.status} ${response.statusText}`; + try { + const errorBody = await response.text(); + errorDetails += ` - ${errorBody}`; + } catch { + // If we can't read the error body, use basic error info + } + console.error(`Batch embeddings API error (batch ${i/batchSize + 1}):`, errorDetails); + throw new Error(`Batch embeddings API error: ${response.status}`); + } + + const data = await response.json(); + const batchEmbeddings = data.data.map((item: any) => item.embedding); + results.push(...batchEmbeddings); + + // Add delay between batches to avoid rate limiting + if (i + batchSize < texts.length && delay > 0) { + await new Promise(resolve => setTimeout(resolve, delay)); + } + + } catch (error) { + console.error(`Failed to process batch ${i/batchSize + 1}:`, error); + throw error; + } + } + + console.log(`[EMBEDDINGS] Successfully processed all ${results.length} embeddings`); + return results; +} + +function cosineSimilarity(a: number[], b: number[]): number { + if (a.length !== b.length) return 0; + + let dotProduct = 0; + let normA = 0; + let normB = 0; + + for (let i = 0; i < a.length; i++) { + dotProduct += a[i] * b[i]; + normA += a[i] * a[i]; + normB += b[i] * b[i]; + } + + return dotProduct / (Math.sqrt(normA) * Math.sqrt(normB)); +} + +export function createEmbeddingContent(item: any): string { 
+ const maxDescriptionLength = 200; + const maxTags = 5; + const maxTotalLength = 400; + + // Truncate description if too long + const description = item.description?.slice(0, maxDescriptionLength) || ''; + + // Limit tags + const tags = (item.tags || []).slice(0, maxTags).join(', '); + + let content: string; + + if (item.type === 'concept') { + content = `${item.name}: ${description}`; + if (tags) content += ` | Tags: ${tags}`; + if (item.domains?.length) content += ` | Domains: ${item.domains.slice(0, 3).join(', ')}`; + } else { + content = `${item.name}: ${description}`; + if (tags) content += ` | Tags: ${tags}`; + if (item.platforms?.length) content += ` | Platforms: ${item.platforms.slice(0, 3).join(', ')}`; + if (item.skillLevel) content += ` | Skill: ${item.skillLevel}`; + } + + // Ensure total length doesn't exceed limit + if (content.length > maxTotalLength) { + content = content.slice(0, maxTotalLength - 3) + '...'; + } + + return content; +} + +export async function generateToolEmbeddings(toolsData: any): Promise { + const allItems = [ + ...toolsData.tools.map((tool: any) => ({ ...tool, type: 'tool' })), + ...toolsData.concepts.map((concept: any) => ({ ...concept, type: 'concept' })) + ]; + + console.log(`[EMBEDDINGS] Creating content for ${allItems.length} items`); + const contents = allItems.map(createEmbeddingContent); + + // Log content length statistics + const lengths = contents.map(c => c.length); + const avgLength = lengths.reduce((a, b) => a + b, 0) / lengths.length; + const maxLength = Math.max(...lengths); + console.log(`[EMBEDDINGS] Content lengths - avg: ${Math.round(avgLength)}, max: ${maxLength}`); + + const embeddings = await generateBatchEmbeddings(contents); + + return allItems.map((item, index) => ({ + id: `${item.type}_${item.name}`, + name: item.name, + type: item.type, + embedding: embeddings[index], + content: contents[index], + tool: item + })); +} + +export async function findSimilarItems(query: string, toolEmbeddings: ToolEmbedding[]): Promise { + const maxCandidates = parseInt(process.env.AI_EMBEDDING_CANDIDATES || '30'); + const threshold = parseFloat(process.env.AI_SIMILARITY_THRESHOLD || '0.3'); + + const queryEmbedding = await generateEmbedding(query); + + const similarities = toolEmbeddings.map(item => ({ + ...item, + similarity: cosineSimilarity(queryEmbedding, item.embedding) + })); + + return similarities + .filter(item => item.similarity >= threshold) + .sort((a, b) => b.similarity - a.similarity) + .slice(0, maxCandidates); +} \ No newline at end of file diff --git a/src/utils/rateLimitedQueue.ts b/src/utils/rateLimitedQueue.ts index e858b25..4d41157 100644 --- a/src/utils/rateLimitedQueue.ts +++ b/src/utils/rateLimitedQueue.ts @@ -1,5 +1,3 @@ -// src/utils/rateLimitedQueue.ts - import dotenv from "dotenv"; dotenv.config(); @@ -25,6 +23,11 @@ export interface QueueStatus { taskStatus?: string; } +interface ChainedTaskResult { + stage1Result: any; + finalResult: T; +} + class RateLimitedQueue { private tasks: QueuedTask[] = []; private isProcessing = false; @@ -60,6 +63,39 @@ class RateLimitedQueue { }); } + addChained( + stage1Task: Task, + stage2TaskBuilder: (stage1Result: any) => Task, + taskId?: string + ): Promise> { + const id = taskId || this.generateTaskId(); + + return new Promise>((resolve, reject) => { + const chainedTask: QueuedTask = { + id, + task: async () => { + try { + const stage1Result = await stage1Task(); + const stage2Task = stage2TaskBuilder(stage1Result); + const finalResult = await stage2Task(); + + const result = { 
stage1Result, finalResult }; + resolve(result); + return result; + } catch (err) { + reject(err); + throw err; + } + }, + addedAt: Date.now(), + status: 'queued' + }; + + this.tasks.push(chainedTask); + setTimeout(() => this.processQueue(), 100); + }); + } + getStatus(taskId?: string): QueueStatus { const queuedTasks = this.tasks.filter(t => t.status === 'queued'); const processingTasks = this.tasks.filter(t => t.status === 'processing'); @@ -103,7 +139,6 @@ class RateLimitedQueue { const processingOffset = processingTasks.length > 0 ? 1 : 0; status.currentPosition = processingOffset + positionInQueue + 1; } - } else if (task.status === 'completed' || task.status === 'failed') { } } else { const taskTimestamp = taskId.match(/ai_(\d+)_/)?.[1]; @@ -152,16 +187,13 @@ class RateLimitedQueue { this.currentlyProcessingTaskId = nextTask.id; this.lastProcessedAt = Date.now(); - try { await nextTask.task(); nextTask.status = 'completed'; nextTask.completedAt = Date.now(); - console.log(`[QUEUE] Task ${nextTask.id} completed`); } catch (error) { nextTask.status = 'failed'; nextTask.completedAt = Date.now(); - console.error(`[QUEUE] Task ${nextTask.id} failed:`, error); } this.currentlyProcessingTaskId = null; @@ -169,20 +201,17 @@ class RateLimitedQueue { setTimeout(() => { const index = this.tasks.findIndex(t => t.id === nextTask.id); if (index >= 0) { - console.log(`[QUEUE] Removing completed task ${nextTask.id}`); this.tasks.splice(index, 1); } }, 10000); const hasMoreQueued = this.tasks.some(t => t.status === 'queued'); if (hasMoreQueued) { - console.log(`[QUEUE] Waiting ${this.delayMs}ms before next task`); await new Promise((r) => setTimeout(r, this.delayMs)); } } } finally { this.isProcessing = false; - console.log(`[QUEUE] Queue processing finished`); } } @@ -197,6 +226,14 @@ export function enqueueApiCall(task: Task, taskId?: string): Promise { return queue.add(task, taskId); } +export function enqueueChainedApiCall( + stage1Task: Task, + stage2TaskBuilder: (stage1Result: any) => Task, + taskId?: string +): Promise> { + return queue.addChained(stage1Task, stage2TaskBuilder, taskId); +} + export function getQueueStatus(taskId?: string): QueueStatus { return queue.getStatus(taskId); }
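
Note on the two-stage query flow introduced above: stage 1 narrows the full tool catalogue to a candidate list (embeddings when AI_EMBEDDINGS_ENABLED=true, otherwise the text-score fallback inside query.ts), stage 2 passes only those candidates to the analyzer model, and both stages run as a single unit in the rate-limited queue via enqueueChainedApiCall. The sketch below is a minimal illustration of how those pieces compose from a caller's perspective; it is not part of the patch, the import paths are assumed relative to the repo root, the demoSelectAndCount name is hypothetical, and the head-slice in the else branch merely stands in for the non-exported text-based fallback.

// Minimal usage sketch (assumptions noted above), TypeScript/ESM style matching the repo.
import { enqueueChainedApiCall } from './src/utils/rateLimitedQueue.js';
import {
  isEmbeddingsEnabled,
  generateToolEmbeddings,
  findSimilarItems,
} from './src/utils/embeddingsService.js';

async function demoSelectAndCount(query: string, toolsData: any) {
  // Stage 1: reduce the catalogue (toolsData as returned by getCompressedToolsDataForAI())
  // to a candidate list. With embeddings enabled this mirrors the embeddings path in
  // query.ts; otherwise a trivial head-slice stands in for the text-based fallback.
  const stage1 = async () => {
    if (!isEmbeddingsEnabled()) {
      return toolsData.tools.slice(0, 30);
    }
    const toolEmbeddings = await generateToolEmbeddings(toolsData);
    const similar = await findSimilarItems(query, toolEmbeddings);
    return similar.map((hit) => hit.tool);
  };

  // Stage 2 is built from the stage-1 result and runs inside the same queued task,
  // so the rate limiter treats both AI round trips as one unit of work.
  const result = await enqueueChainedApiCall(
    stage1,
    (candidates: any[]) => async () => ({ candidateCount: candidates.length }),
    `demo_${Date.now()}`
  );

  console.log(
    `stage 1 returned ${result.stage1Result.length} candidates,`,
    `stage 2 saw ${result.finalResult.candidateCount}`
  );
}

Running both stages through addChained keeps the selector and analyzer calls back to back under one queue slot, so the delayMs pacing the queue already applies between tasks is paid once per user query rather than once per AI call.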