GT AI OS Community Edition v2.0.33

Security hardening release addressing CodeQL and Dependabot alerts: - Fix stack trace exposure in error responses - Add SSRF protection with DNS resolution checking - Implement proper URL hostname validation (replaces substring matching) - Add centralized path sanitization to prevent path traversal - Fix ReDoS vulnerability in email validation regex - Improve HTML sanitization in validation utilities - Fix capability wildcard matching in auth utilities - Update glob dependency to address CVE - Add CodeQL suppression comments for verified false positives 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2025-12-12 17:04:45 -05:00
commit b9dfb86260
746 changed files with 232071 additions and 0 deletions
--- a/apps/tenant-app/src/services/orchestrator.ts
+++ b/apps/tenant-app/src/services/orchestrator.ts
@@ -0,0 +1,270 @@
+/**
+ * GT 2.0 Task Orchestrator Service
+ * 
+ * DeepAgent-inspired intelligent orchestration layer that analyzes user intent
+ * and selects optimal resources (datasets, history, or direct LLM) for responses.
+ */
+
+import { searchDocuments, searchConversationHistory, ConversationHistoryResult, SearchResult } from './documents';
+import { api } from './api';
+
+export interface TaskContext {
+  conversationId: string;
+  userId: string;
+  availableDatasets: string[];
+  selectedDatasets: string[];
+  historySearchEnabled: boolean;
+  agentId?: string;
+}
+
+export interface IntentAnalysis {
+  intent: 'question' | 'task' | 'creative' | 'analysis';
+  complexity: 'simple' | 'moderate' | 'complex';
+  needsContext: boolean;
+  needsHistory: boolean;
+  confidence: number;
+  reasoning: string;
+}
+
+export interface ResourceSelection {
+  useDatasets: boolean;
+  useHistory: boolean;
+  searchMethod: 'vector' | 'hybrid' | 'keyword';
+  datasetIds: string[];
+  historyParams?: {
+    days_back: number;
+    agent_filter?: string[];
+  };
+}
+
+export interface OrchestrationResult {
+  intent: IntentAnalysis;
+  resources: ResourceSelection;
+  contextSources: ContextSource[];
+  historyResults?: ConversationHistoryResult[];
+  searchResults?: SearchResult[];
+}
+
+export interface ContextSource {
+  id: string;
+  type: 'dataset' | 'history' | 'direct';
+  name: string;
+  relevance: number;
+  content?: string;
+}
+
+export class TaskOrchestrator {
+  private readonly INTENT_KEYWORDS = {
+    question: ['what', 'how', 'why', 'when', 'where', 'explain', 'tell me about'],
+    task: ['create', 'build', 'generate', 'write', 'make', 'develop', 'implement'],
+    creative: ['imagine', 'story', 'poem', 'creative', 'artistic', 'design'],
+    analysis: ['analyze', 'compare', 'evaluate', 'review', 'assess', 'study']
+  };
+
+  private readonly CONTEXT_INDICATORS = [
+    'based on', 'according to', 'in the document', 'from the data', 
+    'previously', 'earlier', 'last time', 'before'
+  ];
+
+  private readonly HISTORY_INDICATORS = [
+    'previously', 'earlier', 'last time', 'before', 'remember when',
+    'what did we discuss', 'go back to', 'from our conversation'
+  ];
+
+  async orchestrate(query: string, context: TaskContext): Promise<OrchestrationResult> {
+    // Step 1: Analyze user intent
+    const intent = this.analyzeIntent(query);
+
+    // Step 2: Determine resource needs
+    const resources = await this.selectResources(query, intent, context);
+
+    // Step 3: Gather context from selected resources
+    const contextSources: ContextSource[] = [];
+    let historyResults: ConversationHistoryResult[] = [];
+    let searchResults: SearchResult[] = [];
+
+    // Execute dataset search if needed
+    if (resources.useDatasets && resources.datasetIds.length > 0) {
+      try {
+        const searchResponse = await searchDocuments({
+          query,
+          dataset_ids: resources.datasetIds,
+          search_method: resources.searchMethod,
+          top_k: 5,
+          similarity_threshold: 0.7
+        });
+
+        if (searchResponse.success) {
+          searchResults = searchResponse.data.results;
+          searchResults.forEach(result => {
+            contextSources.push({
+              id: result.chunk_id,
+              type: 'dataset',
+              name: `Document: ${result.document}`,
+              relevance: result.similarity,
+              content: result.metadata?.content || result.document
+            });
+          });
+        }
+      } catch (error) {
+        console.error('Dataset search failed:', error);
+      }
+    }
+
+    // Execute history search if needed
+    if (resources.useHistory) {
+      try {
+        const historyResponse = await searchConversationHistory({
+          query,
+          ...resources.historyParams,
+          limit: 5
+        });
+
+        if (historyResponse.success) {
+          historyResults = historyResponse.data;
+          historyResults.forEach(result => {
+            contextSources.push({
+              id: result.message_id,
+              type: 'history',
+              name: `${result.conversation_title} - ${result.agent_name}`,
+              relevance: result.relevance_score,
+              content: result.content
+            });
+          });
+        }
+      } catch (error) {
+        console.error('History search failed:', error);
+      }
+    }
+
+    // Sort context sources by relevance
+    contextSources.sort((a, b) => b.relevance - a.relevance);
+
+    return {
+      intent,
+      resources,
+      contextSources: contextSources.slice(0, 8), // Limit to top 8 sources
+      historyResults,
+      searchResults
+    };
+  }
+
+  private analyzeIntent(query: string): IntentAnalysis {
+    const lowerQuery = query.toLowerCase();
+    const words = lowerQuery.split(/\s+/);
+
+    // Determine primary intent
+    let intent: IntentAnalysis['intent'] = 'question';
+    let maxScore = 0;
+
+    for (const [intentType, keywords] of Object.entries(this.INTENT_KEYWORDS)) {
+      const score = keywords.reduce((acc, keyword) => {
+        return acc + (lowerQuery.includes(keyword) ? 1 : 0);
+      }, 0);
+
+      if (score > maxScore) {
+        maxScore = score;
+        intent = intentType as IntentAnalysis['intent'];
+      }
+    }
+
+    // Determine complexity based on query length and structure
+    const complexity: IntentAnalysis['complexity'] = 
+      words.length < 5 ? 'simple' :
+      words.length < 15 ? 'moderate' : 'complex';
+
+    // Check if context is needed
+    const needsContext = this.CONTEXT_INDICATORS.some(indicator => 
+      lowerQuery.includes(indicator)
+    );
+
+    // Check if history is needed
+    const needsHistory = this.HISTORY_INDICATORS.some(indicator => 
+      lowerQuery.includes(indicator)
+    );
+
+    const confidence = Math.min(0.9, 0.5 + (maxScore * 0.1));
+
+    return {
+      intent,
+      complexity,
+      needsContext: needsContext || intent === 'analysis',
+      needsHistory,
+      confidence,
+      reasoning: `Intent: ${intent}, Keywords found: ${maxScore}, Length: ${words.length} words`
+    };
+  }
+
+  private async selectResources(
+    query: string,
+    intent: IntentAnalysis,
+    context: TaskContext
+  ): Promise<ResourceSelection> {
+    const resources: ResourceSelection = {
+      useDatasets: false,
+      useHistory: false,
+      searchMethod: 'hybrid',
+      datasetIds: []
+    };
+
+    // Use datasets if context is needed and datasets are available
+    if ((intent.needsContext || intent.intent === 'analysis') && context.selectedDatasets.length > 0) {
+      resources.useDatasets = true;
+      resources.datasetIds = context.selectedDatasets;
+      
+      // Choose search method based on intent and complexity
+      if (intent.intent === 'creative') {
+        resources.searchMethod = 'vector'; // Better for semantic similarity
+      } else if (intent.complexity === 'simple') {
+        resources.searchMethod = 'keyword'; // Faster for simple queries
+      } else {
+        resources.searchMethod = 'hybrid'; // Best overall performance
+      }
+    }
+
+    // Use history if explicitly requested or if pattern suggests it
+    if (context.historySearchEnabled && (intent.needsHistory || intent.complexity === 'complex')) {
+      resources.useHistory = true;
+      resources.historyParams = {
+        days_back: intent.complexity === 'complex' ? 60 : 30,
+        agent_filter: context.agentId ? [context.agentId] : undefined
+      };
+    }
+
+    return resources;
+  }
+
+  /**
+   * Generate a prompt with context for the LLM
+   */
+  generateContextualPrompt(
+    originalQuery: string,
+    orchestrationResult: OrchestrationResult
+  ): string {
+    let prompt = originalQuery;
+
+    if (orchestrationResult.contextSources.length === 0) {
+      return prompt;
+    }
+
+    // Add context header
+    prompt += '\n\n--- CONTEXT ---\n';
+    
+    // Add relevant sources
+    orchestrationResult.contextSources.forEach((source, index) => {
+      prompt += `\n${index + 1}. [${source.type.toUpperCase()}] ${source.name}\n`;
+      if (source.content) {
+        prompt += `   ${source.content.substring(0, 500)}${source.content.length > 500 ? '...' : ''}\n`;
+      }
+    });
+
+    prompt += '\n--- END CONTEXT ---\n\n';
+    prompt += 'Please answer based on the provided context when relevant. ';
+    prompt += 'If the context doesn\'t contain relevant information, please indicate that and provide a general response.';
+
+    return prompt;
+  }
+}
+
+// Singleton instance
+export const taskOrchestrator = new TaskOrchestrator();