Optimize all AI functions for efficiency and speed

- AI Tagging: batch 10 projects per API call with 3 concurrent batches (~10x faster) - New `tagProjectsBatch()` with `getAISuggestionsBatch()` for multi-project prompts - Single DB query for all projects, single anonymization pass - Compact JSON in prompts (no pretty-print) saves tokens - AI Shortlist: run STARTUP and BUSINESS_CONCEPT categories in parallel (2x faster) - AI Filtering: increase default parallel batches from 1 to 3 (3x faster) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-16 14:02:38 +01:00
parent 989db4dc14
commit 65a22e6f19
4 changed files with 377 additions and 49 deletions
--- a/src/server/routers/tag.ts
+++ b/src/server/routers/tag.ts
@@ -5,6 +5,7 @@ import { prisma } from '@/lib/prisma'
 import { logAudit } from '../utils/audit'
 import {
  tagProject,
  tagProjectsBatch,
  getTagSuggestions,
  addProjectTag,
  removeProjectTag,
@@ -17,7 +18,7 @@ import {
  NotificationTypes,
 } from '../services/in-app-notification'
-// Background job runner for tagging
+// Background job runner for tagging — uses batched API calls for efficiency
 async function runTaggingJob(jobId: string, userId: string) {
  const job = await prisma.taggingJob.findUnique({
    where: { id: jobId },
@@ -28,7 +29,7 @@ async function runTaggingJob(jobId: string, userId: string) {
    return
  }
-  console.log(`[AI Tagging Job] Starting job ${jobId}...`)
+  console.log(`[AI Tagging Job] Starting job ${jobId} (batched mode)...`)
  // Mark as running
  await prisma.taggingJob.update({
@@ -56,7 +57,7 @@ async function runTaggingJob(jobId: string, userId: string) {
    const allProjects = await prisma.project.findMany({
      where: whereClause,
-      select: { id: true, title: true, tags: true },
+      select: { id: true, title: true, tags: true, projectTags: { select: { tagId: true } } },
    })
    const untaggedProjects = allProjects.filter(p => p.tags.length === 0)
@@ -83,48 +84,33 @@ async function runTaggingJob(jobId: string, userId: string) {
      return
    }
    let taggedCount = 0
    let failedCount = 0
    const errors: string[] = []
    const startTime = Date.now()
-    for (let i = 0; i < untaggedProjects.length; i++) {
+    // Use batched tagging — processes 10 projects per API call, 3 concurrent calls
-      const project = untaggedProjects[i]
+    const { results, totalTokens } = await tagProjectsBatch(
-      console.log(`[AI Tagging Job] Processing ${i + 1}/${untaggedProjects.length}: "${project.title.substring(0, 40)}..."`)
+      untaggedProjects,
      userId,
      async (processed, total) => {
        // Update job progress on each batch completion
        const taggedSoFar = results?.length ?? processed
        await prisma.taggingJob.update({
          where: { id: jobId },
          data: {
            processedCount: processed,
            taggedCount: taggedSoFar,
          },
        })
      try {
        const result = await tagProject(project.id, userId)
        taggedCount++
        console.log(`[AI Tagging Job] ✓ Tagged with ${result.applied.length} tags`)
      } catch (error) {
        failedCount++
        const errorMsg = error instanceof Error ? error.message : 'Unknown error'
        errors.push(`${project.title}: ${errorMsg}`)
        console.error(`[AI Tagging Job] ✗ Failed: ${errorMsg}`)
      }
      // Update progress
      await prisma.taggingJob.update({
        where: { id: jobId },
        data: {
          processedCount: i + 1,
          taggedCount,
          failedCount,
          errorsJson: errors.length > 0 ? errors.slice(0, 20) : undefined, // Keep last 20 errors
        },
      })
      // Log progress every 10 projects
      if ((i + 1) % 10 === 0) {
        const elapsed = ((Date.now() - startTime) / 1000).toFixed(0)
-        const avgTime = (Date.now() - startTime) / (i + 1) / 1000
+        console.log(`[AI Tagging Job] Progress: ${processed}/${total} (${elapsed}s elapsed)`)
        const remaining = avgTime * (untaggedProjects.length - i - 1)
        console.log(`[AI Tagging Job] Progress: ${i + 1}/${untaggedProjects.length} (${elapsed}s elapsed, ~${remaining.toFixed(0)}s remaining)`)
      }
-    }
+    )
    const taggedCount = results.filter(r => r.applied.length > 0).length
    const failedCount = untaggedProjects.length - results.length
    const totalTime = ((Date.now() - startTime) / 1000).toFixed(1)
-    console.log(`[AI Tagging Job] Complete: ${taggedCount} tagged, ${failedCount} failed in ${totalTime}s`)
+    console.log(`[AI Tagging Job] Complete: ${taggedCount} tagged, ${failedCount} failed in ${totalTime}s (${totalTokens} tokens)`)
    // Mark as completed
    await prisma.taggingJob.update({
@@ -132,7 +118,9 @@ async function runTaggingJob(jobId: string, userId: string) {
      data: {
        status: 'COMPLETED',
        completedAt: new Date(),
-        errorsJson: errors.length > 0 ? errors : undefined,
+        processedCount: results.length,
        taggedCount,
        failedCount,
      },
    })
@@ -144,7 +132,7 @@ async function runTaggingJob(jobId: string, userId: string) {
      linkUrl: '/admin/projects',
      linkLabel: 'View Projects',
      priority: 'normal',
-      metadata: { jobId, taggedCount, failedCount, skippedCount },
+      metadata: { jobId, taggedCount, failedCount, skippedCount, totalTokens },
    })
  } catch (error) {
--- a/src/server/services/ai-filtering.ts
+++ b/src/server/services/ai-filtering.ts
@@ -142,7 +142,7 @@ interface FilteringRuleInput {
 const DEFAULT_BATCH_SIZE = 20
 const MAX_BATCH_SIZE = 50
 const MIN_BATCH_SIZE = 1
-const DEFAULT_PARALLEL_BATCHES = 1
+const DEFAULT_PARALLEL_BATCHES = 3
 const MAX_PARALLEL_BATCHES = 10
 // Structured system prompt for AI screening
--- a/src/server/services/ai-shortlist.ts
+++ b/src/server/services/ai-shortlist.ts
@@ -344,8 +344,8 @@ export async function generateShortlist(
    let totalTokens = 0
    const allErrors: string[] = []
-    // Run each category independently
+    // Run categories in parallel for efficiency
-    for (const cat of categories) {
+    const categoryPromises = categories.map(async (cat) => {
      const catTopN = cat === 'STARTUP'
        ? (startupTopN ?? topN)
        : (conceptTopN ?? topN)
@@ -357,6 +357,12 @@ export async function generateShortlist(
        prisma,
      )
      return { cat, result }
    })
    const categoryResults = await Promise.all(categoryPromises)
    for (const { cat, result } of categoryResults) {
      if (cat === 'STARTUP') {
        allRecommendations.STARTUP = result.recommendations
      } else {
--- a/src/server/services/ai-tagging.ts
+++ b/src/server/services/ai-tagging.ts
@@ -5,7 +5,7 @@
 *
 * Features:
 * - Single project tagging (on-submit or manual)
- * - Batch tagging for rounds
+ * - Batch tagging with concurrent processing (10 projects/batch, 3 concurrent)
 * - Confidence scores for each tag
 * - Additive only - never removes existing tags
 *
@@ -53,8 +53,10 @@ interface AvailableTag {
 const CONFIDENCE_THRESHOLD = 0.5
 const DEFAULT_MAX_TAGS = 5
 const BATCH_SIZE = 10 // Projects per API call
 const BATCH_CONCURRENCY = 3 // Concurrent API calls
-// System prompt optimized for tag suggestion
+// System prompt optimized for single-project tag suggestion
 const TAG_SUGGESTION_SYSTEM_PROMPT = `You are an expert at categorizing ocean conservation and sustainability projects.
 Analyze the project and suggest the most relevant expertise tags from the provided list.
@@ -78,6 +80,36 @@ Rules:
 - Maximum 7 suggestions per project
 - Be conservative - only suggest tags that truly apply`
 // System prompt optimized for batch tagging (multiple projects in one call)
 const BATCH_TAG_SYSTEM_PROMPT = `You are an expert at categorizing ocean conservation and sustainability projects.
 Analyze EACH project and suggest the most relevant expertise tags from the provided list.
 Consider each project's focus areas, technology, methodology, and domain.
 Return JSON with this format:
 {
  "projects": [
    {
      "project_id": "PROJECT_001",
      "suggestions": [
        {
          "tag_name": "exact tag name from list",
          "confidence": 0.0-1.0,
          "reasoning": "brief explanation"
        }
      ]
    }
  ]
 }
 Rules:
 - Only suggest tags from the provided list (exact names)
 - Order by relevance (most relevant first)
 - Confidence should reflect how well the tag matches
 - Maximum 7 suggestions per project
 - Be conservative - only suggest tags that truly apply
 - Return results for ALL projects provided`
 // ─── Helper Functions ────────────────────────────────────────────────────────
 /**
@@ -132,7 +164,8 @@ export async function getAvailableTags(): Promise<AvailableTag[]> {
 // ─── AI Tagging Core ─────────────────────────────────────────────────────────
 /**
- * Call OpenAI to get tag suggestions for a project
+ * Call OpenAI to get tag suggestions for a single project
 * Used for on-demand single-project tagging
 */
 async function getAISuggestions(
  anonymizedProject: AnonymizedProjectForAI,
@@ -147,7 +180,7 @@ async function getAISuggestions(
  const model = await getConfiguredModel()
-  // Build tag list for prompt
+  // Build compact tag list for prompt
  const tagList = availableTags.map((t) => ({
    name: t.name,
    category: t.category,
@@ -155,10 +188,10 @@ async function getAISuggestions(
  }))
  const userPrompt = `PROJECT:
-${JSON.stringify(anonymizedProject, null, 2)}
+${JSON.stringify(anonymizedProject)}
 AVAILABLE TAGS:
-${JSON.stringify(tagList, null, 2)}
+${JSON.stringify(tagList)}
 Suggest relevant tags for this project.`
@@ -246,6 +279,160 @@ Suggest relevant tags for this project.`
  }
 }
 /**
 * Call OpenAI to get tag suggestions for a batch of projects in one API call.
 * Returns a map of project_id -> TagSuggestion[].
 */
 async function getAISuggestionsBatch(
  anonymizedProjects: AnonymizedProjectForAI[],
  availableTags: AvailableTag[],
  userId?: string
 ): Promise<{ suggestionsMap: Map<string, TagSuggestion[]>; tokensUsed: number }> {
  const openai = await getOpenAI()
  if (!openai) {
    console.warn('[AI Tagging] OpenAI not configured')
    return { suggestionsMap: new Map(), tokensUsed: 0 }
  }
  const model = await getConfiguredModel()
  const suggestionsMap = new Map<string, TagSuggestion[]>()
  // Build compact tag list (sent once for entire batch)
  const tagList = availableTags.map((t) => ({
    name: t.name,
    category: t.category,
    description: t.description,
  }))
  const userPrompt = `PROJECTS (${anonymizedProjects.length}):
 ${JSON.stringify(anonymizedProjects)}
 AVAILABLE TAGS:
 ${JSON.stringify(tagList)}
 Suggest relevant tags for each project.`
  const MAX_PARSE_RETRIES = 2
  let parseAttempts = 0
  try {
    const params = buildCompletionParams(model, {
      messages: [
        { role: 'system', content: BATCH_TAG_SYSTEM_PROMPT },
        { role: 'user', content: userPrompt },
      ],
      jsonMode: true,
      temperature: 0.1,
      maxTokens: Math.min(4000, anonymizedProjects.length * 500),
    })
    let response = await openai.chat.completions.create(params)
    let usage = extractTokenUsage(response)
    let totalTokens = usage.totalTokens
    // Parse with retry logic
    let parsed: {
      projects: Array<{
        project_id: string
        suggestions: Array<{
          tag_name: string
          confidence: number
          reasoning: string
        }>
      }>
    }
    while (true) {
      try {
        const content = response.choices[0]?.message?.content
        if (!content) throw new Error('Empty response from AI')
        const raw = JSON.parse(content)
        parsed = raw.projects ? raw : { projects: Array.isArray(raw) ? raw : [] }
        break
      } catch (parseError) {
        if (parseError instanceof SyntaxError && parseAttempts < MAX_PARSE_RETRIES) {
          parseAttempts++
          console.warn(`[AI Tagging Batch] JSON parse failed, retrying (${parseAttempts}/${MAX_PARSE_RETRIES})`)
          const retryParams = buildCompletionParams(model, {
            messages: [
              { role: 'system', content: BATCH_TAG_SYSTEM_PROMPT },
              { role: 'user', content: userPrompt + '\n\nIMPORTANT: Please ensure valid JSON output.' },
            ],
            jsonMode: true,
            temperature: 0.1,
            maxTokens: Math.min(4000, anonymizedProjects.length * 500),
          })
          response = await openai.chat.completions.create(retryParams)
          const retryUsage = extractTokenUsage(response)
          totalTokens += retryUsage.totalTokens
          continue
        }
        throw parseError
      }
    }
    // Log usage for the entire batch
    await logAIUsage({
      userId,
      action: 'PROJECT_TAGGING',
      entityType: 'Project',
      model,
      promptTokens: usage.promptTokens,
      completionTokens: usage.completionTokens,
      totalTokens,
      batchSize: anonymizedProjects.length,
      itemsProcessed: parsed.projects?.length || 0,
      status: 'SUCCESS',
    })
    // Map results back to TagSuggestion format
    for (const projectResult of parsed.projects || []) {
      const suggestions: TagSuggestion[] = []
      for (const s of projectResult.suggestions || []) {
        const tag = availableTags.find(
          (t) => t.name.toLowerCase() === s.tag_name.toLowerCase()
        )
        if (tag) {
          suggestions.push({
            tagId: tag.id,
            tagName: tag.name,
            confidence: Math.max(0, Math.min(1, s.confidence)),
            reasoning: s.reasoning || '',
          })
        }
      }
      suggestionsMap.set(projectResult.project_id, suggestions)
    }
    return { suggestionsMap, tokensUsed: totalTokens }
  } catch (error) {
    if (error instanceof SyntaxError) {
      const parseError = createParseError(error.message)
      logAIError('Tagging', 'getAISuggestionsBatch', parseError)
    }
    const classified = classifyAIError(error)
    logAIError('Tagging', 'getAISuggestionsBatch', classified)
    await logAIUsage({
      userId,
      action: 'PROJECT_TAGGING',
      entityType: 'Project',
      model: 'unknown',
      promptTokens: 0,
      completionTokens: 0,
      totalTokens: 0,
      batchSize: anonymizedProjects.length,
      itemsProcessed: 0,
      status: 'ERROR',
      errorMessage: error instanceof Error ? error.message : 'Unknown error',
    })
    throw error
  }
 }
 // ─── Public API ──────────────────────────────────────────────────────────────
 /**
@@ -355,6 +542,153 @@ export async function tagProject(
  }
 }
 /**
 * Tag a batch of projects using batched API calls with concurrency.
 * Much more efficient than tagging one-by-one for bulk operations.
 *
 * @param projects Array of { id, projectTags } to tag
 * @param userId The user initiating the tagging
 * @param onProgress Callback for progress updates
 * @returns Array of TaggingResult
 */
 export async function tagProjectsBatch(
  projects: Array<{
    id: string
    title: string
    projectTags: Array<{ tagId: string }>
  }>,
  userId: string,
  onProgress?: (processed: number, total: number) => Promise<void>
 ): Promise<{ results: TaggingResult[]; totalTokens: number }> {
  const settings = await getTaggingSettings()
  if (!settings.enabled) {
    return { results: [], totalTokens: 0 }
  }
  const availableTags = await getAvailableTags()
  if (availableTags.length === 0) {
    return { results: [], totalTokens: 0 }
  }
  // Fetch full project data for all projects at once (single DB query)
  const fullProjects = await prisma.project.findMany({
    where: { id: { in: projects.map((p) => p.id) } },
    include: {
      projectTags: true,
      files: { select: { fileType: true } },
      _count: { select: { teamMembers: true, files: true } },
    },
  })
  const projectMap = new Map(fullProjects.map((p) => [p.id, p]))
  // Anonymize all projects at once
  const projectsWithRelations = fullProjects.map(toProjectWithRelations)
  const { anonymized, mappings } = anonymizeProjectsForAI(projectsWithRelations, 'FILTERING')
  if (!validateAnonymizedProjects(anonymized)) {
    throw new Error('GDPR compliance check failed: PII detected in anonymized data')
  }
  // Build mapping from anonymous ID to real project
  const anonToRealMap = new Map<string, string>()
  for (const mapping of mappings) {
    anonToRealMap.set(mapping.anonymousId, mapping.realId)
  }
  // Split into batches
  const batches: AnonymizedProjectForAI[][] = []
  for (let i = 0; i < anonymized.length; i += BATCH_SIZE) {
    batches.push(anonymized.slice(i, i + BATCH_SIZE))
  }
  const allResults: TaggingResult[] = []
  let totalTokens = 0
  let processedCount = 0
  // Process batches with concurrency
  for (let i = 0; i < batches.length; i += BATCH_CONCURRENCY) {
    const concurrentBatches = batches.slice(i, i + BATCH_CONCURRENCY)
    const batchPromises = concurrentBatches.map(async (batch) => {
      try {
        const { suggestionsMap, tokensUsed } = await getAISuggestionsBatch(
          batch,
          availableTags,
          userId
        )
        return { suggestionsMap, tokensUsed, error: null }
      } catch (error) {
        console.error('[AI Tagging Batch] Batch failed:', error)
        return { suggestionsMap: new Map<string, TagSuggestion[]>(), tokensUsed: 0, error }
      }
    })
    const batchResults = await Promise.all(batchPromises)
    // Process results from all concurrent batches
    for (const { suggestionsMap, tokensUsed } of batchResults) {
      totalTokens += tokensUsed
      for (const [anonId, suggestions] of suggestionsMap) {
        const realId = anonToRealMap.get(anonId)
        if (!realId) continue
        const project = projectMap.get(realId)
        if (!project) continue
        // Filter by confidence
        const validSuggestions = suggestions.filter(
          (s) => s.confidence >= settings.confidenceThreshold
        )
        // Get existing tags
        const existingTagIds = new Set(project.projectTags.map((pt) => pt.tagId))
        const currentTagCount = project.projectTags.length
        const remainingSlots = Math.max(0, settings.maxTags - currentTagCount)
        const newSuggestions = validSuggestions
          .filter((s) => !existingTagIds.has(s.tagId))
          .slice(0, remainingSlots)
        // Apply tags
        const applied: TagSuggestion[] = []
        for (const suggestion of newSuggestions) {
          try {
            await prisma.projectTag.create({
              data: {
                projectId: realId,
                tagId: suggestion.tagId,
                confidence: suggestion.confidence,
                source: 'AI',
              },
            })
            applied.push(suggestion)
          } catch {
            // Skip duplicates
          }
        }
        allResults.push({
          projectId: realId,
          suggestions,
          applied,
          tokensUsed: 0, // Token tracking is per-batch, not per-project
        })
        processedCount++
      }
    }
    // Report progress after each concurrent chunk
    if (onProgress) {
      await onProgress(processedCount, projects.length)
    }
  }
  return { results: allResults, totalTokens }
 }
 /**
 * Get tag suggestions for a project without applying them
 * Useful for preview/review before applying