try a context approach
src/services/llm/trilium_context_service.ts (new file, 410 lines)

@@ -0,0 +1,410 @@
import becca from "../../becca/becca.js";
import vectorStore from "./embeddings/vector_store.js";
import providerManager from "./embeddings/providers.js";
import options from "../options.js";
import log from "../log.js";
import type { Message } from "./ai_interface.js";
import { cosineSimilarity } from "./embeddings/vector_store.js";

/**
 * TriliumContextService provides intelligent context management for working with
 * large knowledge bases through LLMs that have limited context windows, such as Ollama.
 *
 * It uses a "meta-prompting" approach: a first LLM call determines what information
 * is needed to answer the query, only the relevant context is then loaded, and the
 * final response is generated from that context.
 */
class TriliumContextService {
    private initialized = false;
    private initPromise: Promise<void> | null = null;
    private provider: any = null;

    // Cache for recently used context to avoid repeated embedding lookups
    private recentQueriesCache = new Map<string, {
        timestamp: number,
        relevantNotes: any[]
    }>();

    // Configuration
    private cacheExpiryMs = 5 * 60 * 1000; // 5 minutes
    private metaPrompt = `You are an AI assistant that decides what information needs to be retrieved from a knowledge base to answer the user's question.
Given the user's question, generate 3-5 specific search queries that would help find relevant information.
Each query should be focused on a different aspect of the question.
Format your answer as a JSON array of strings, with each string being a search query.
Example: ["exact topic mentioned", "related concept 1", "related concept 2"]`;

    constructor() {
        this.setupCacheCleanup();
    }

    /**
     * Initialize the service
     */
    async initialize() {
        if (this.initialized) return;

        // Use a promise to prevent multiple simultaneous initializations
        if (this.initPromise) return this.initPromise;

        this.initPromise = (async () => {
            try {
                const providerId = await options.getOption('embeddingsDefaultProvider') || 'ollama';
                this.provider = providerManager.getEmbeddingProvider(providerId);

                if (!this.provider) {
                    throw new Error(`Embedding provider ${providerId} not found`);
                }

                this.initialized = true;
                log.info(`Trilium context service initialized with provider: ${providerId}`);
            } catch (error: unknown) {
                const errorMessage = error instanceof Error ? error.message : String(error);
                log.error(`Failed to initialize Trilium context service: ${errorMessage}`);
                throw error;
            } finally {
                this.initPromise = null;
            }
        })();

        return this.initPromise;
    }

    /**
     * Set up periodic cache cleanup
     */
    private setupCacheCleanup() {
        setInterval(() => {
            const now = Date.now();
            for (const [key, data] of this.recentQueriesCache.entries()) {
                if (now - data.timestamp > this.cacheExpiryMs) {
                    this.recentQueriesCache.delete(key);
                }
            }
        }, 60000); // Run cleanup every minute
    }

    /**
     * Generate search queries to find relevant information for the user question
     * @param userQuestion - The user's question
     * @param llmService - The LLM service to use for generating queries
     * @returns Array of search queries
     */
    async generateSearchQueries(userQuestion: string, llmService: any): Promise<string[]> {
        try {
            const messages: Message[] = [
                { role: "system", content: this.metaPrompt },
                { role: "user", content: userQuestion }
            ];

            // Named completionOptions to avoid shadowing the imported options module
            const completionOptions = {
                temperature: 0.3,
                maxTokens: 300
            };

            // Get the response from the LLM
            const response = await llmService.sendTextCompletion(messages, completionOptions);

            try {
                // Parse the JSON response
                const jsonStr = response.trim().replace(/```json|```/g, '').trim();
                const queries = JSON.parse(jsonStr);

                if (Array.isArray(queries) && queries.length > 0) {
                    return queries;
                } else {
                    throw new Error("Invalid response format");
                }
            } catch (parseError) {
                // Fallback: if JSON parsing fails, try to extract queries line by line
                const lines = response.split('\n')
                    .map((line: string) => line.trim())
                    .filter((line: string) => line.length > 0 && !line.startsWith('```'));

                if (lines.length > 0) {
                    return lines.map((line: string) => line.replace(/^["'\d\.\-\s]+/, '').trim());
                }

                // If all else fails, just use the original question
                return [userQuestion];
            }
        } catch (error: unknown) {
            const errorMessage = error instanceof Error ? error.message : String(error);
            log.error(`Error generating search queries: ${errorMessage}`);
            // Fallback to just using the original question
            return [userQuestion];
        }
    }

    /**
     * Find relevant notes using multiple search queries
     * @param queries - Array of search queries
     * @param contextNoteId - Optional note ID to restrict search to a branch
     * @param limit - Max notes to return
     * @returns Array of relevant notes
     */
    async findRelevantNotesMultiQuery(
        queries: string[],
        contextNoteId: string | null = null,
        limit = 10
    ): Promise<any[]> {
        if (!this.initialized) {
            await this.initialize();
        }

        try {
            // Cache key combining all queries
            const cacheKey = JSON.stringify({ queries, contextNoteId, limit });

            // Check if we have a recent, non-expired cache hit
            const cached = this.recentQueriesCache.get(cacheKey);
            if (cached && Date.now() - cached.timestamp < this.cacheExpiryMs) {
                return cached.relevantNotes;
            }

            // Array to store all results with their similarity scores
            const allResults: {
                noteId: string,
                title: string,
                content: string | null,
                similarity: number,
                branchId?: string
            }[] = [];

            // Set to keep track of note IDs we've seen to avoid duplicates
            const seenNoteIds = new Set<string>();

            // Process each query
            for (const query of queries) {
                // Get embeddings for this query
                const queryEmbedding = await this.provider.getEmbedding(query);

                // Find notes similar to this query
                let results;
                if (contextNoteId) {
                    // Find within a specific context/branch
                    results = await this.findNotesInBranch(
                        queryEmbedding,
                        contextNoteId,
                        Math.min(limit, 5) // Limit per query
                    );
                } else {
                    // Search all notes
                    results = await vectorStore.findSimilarNotes(
                        queryEmbedding,
                        this.provider.id,
                        this.provider.modelId,
                        Math.min(limit, 5), // Limit per query
                        0.5 // Lower threshold to get more diverse results
                    );
                }

                // Process results
                for (const result of results) {
                    if (!seenNoteIds.has(result.noteId)) {
                        seenNoteIds.add(result.noteId);

                        // Get the note from Becca
                        const note = becca.notes[result.noteId];
                        if (!note) continue;

                        // Add to our results
                        allResults.push({
                            noteId: result.noteId,
                            title: note.title,
                            content: note.type === 'text' ? note.getContent() as string : null,
                            similarity: result.similarity,
                            branchId: note.getBranches()[0]?.branchId
                        });
                    }
                }
            }

            // Sort by similarity and take the top 'limit' results
            const sortedResults = allResults
                .sort((a, b) => b.similarity - a.similarity)
                .slice(0, limit);

            // Cache the results
            this.recentQueriesCache.set(cacheKey, {
                timestamp: Date.now(),
                relevantNotes: sortedResults
            });

            return sortedResults;
        } catch (error: unknown) {
            const errorMessage = error instanceof Error ? error.message : String(error);
            log.error(`Error finding relevant notes: ${errorMessage}`);
            return [];
        }
    }

    /**
     * Find notes in a specific branch/context
     * @param embedding - Query embedding
     * @param contextNoteId - Note ID to restrict search to
     * @param limit - Max notes to return
     * @returns Array of relevant notes
     */
    private async findNotesInBranch(
        embedding: Float32Array,
        contextNoteId: string,
        limit = 5
    ): Promise<{noteId: string, similarity: number}[]> {
        try {
            // Get the subtree note IDs
            const subtreeNoteIds = await this.getSubtreeNoteIds(contextNoteId);

            if (subtreeNoteIds.length === 0) {
                return [];
            }

            // Get all embeddings for these notes using vectorStore instead of direct SQL
            const similarities: {noteId: string, similarity: number}[] = [];

            for (const noteId of subtreeNoteIds) {
                const noteEmbedding = await vectorStore.getEmbeddingForNote(
                    noteId,
                    this.provider.id,
                    this.provider.modelId
                );

                if (noteEmbedding) {
                    const similarity = cosineSimilarity(embedding, noteEmbedding.embedding);
                    if (similarity > 0.5) { // Apply similarity threshold
                        similarities.push({
                            noteId,
                            similarity
                        });
                    }
                }
            }

            // Sort by similarity and return top results
            return similarities
                .sort((a, b) => b.similarity - a.similarity)
                .slice(0, limit);
        } catch (error: unknown) {
            const errorMessage = error instanceof Error ? error.message : String(error);
            log.error(`Error finding notes in branch: ${errorMessage}`);
            return [];
        }
    }

    /**
     * Get all note IDs in a subtree (including the root note)
     * @param rootNoteId - Root note ID
     * @returns Array of note IDs
     */
    private async getSubtreeNoteIds(rootNoteId: string): Promise<string[]> {
        const note = becca.notes[rootNoteId];
        if (!note) {
            return [];
        }

        // Use becca to walk the note tree instead of direct SQL
        const noteIds = new Set<string>([rootNoteId]);

        // Helper function to collect all children
        const collectChildNotes = (noteId: string) => {
            const parentNote = becca.notes[noteId];
            if (!parentNote) return;

            // Get all branches where this note is the parent
            for (const branch of Object.values(becca.branches)) {
                if (branch.parentNoteId === noteId && !branch.isDeleted) {
                    const childNoteId = branch.noteId;
                    if (!noteIds.has(childNoteId)) {
                        noteIds.add(childNoteId);
                        // Recursively collect children of this child
                        collectChildNotes(childNoteId);
                    }
                }
            }
        };

        // Start collecting from the root
        collectChildNotes(rootNoteId);

        return Array.from(noteIds);
    }

    /**
     * Build a context string from relevant notes
     * @param sources - Array of notes
     * @param query - Original user query
     * @returns Formatted context string
     */
    buildContextFromNotes(sources: any[], query: string): string {
        if (!sources || sources.length === 0) {
            return "";
        }

        let context = `The following are relevant notes from your knowledge base that may help answer the query: "${query}"\n\n`;

        sources.forEach((source, index) => {
            context += `--- NOTE ${index + 1}: ${source.title} ---\n`;

            if (source.content) {
                // Truncate content if it's too long
                const maxContentLength = 1000;
                let content = source.content;

                if (content.length > maxContentLength) {
                    content = content.substring(0, maxContentLength) + " [content truncated due to length]";
                }

                context += `${content}\n`;
            } else {
                context += "[This note doesn't contain textual content]\n";
            }

            context += "\n";
        });

        context += "--- END OF NOTES ---\n\n";
        context += "Please use the information above to help answer the query. If the information doesn't contain what you need, just say so and use your general knowledge instead.";

        return context;
    }

    /**
     * Process a user query with the Trilium-specific approach:
     * 1. Generate search queries from the original question
     * 2. Find relevant notes using those queries
     * 3. Build a context string from the relevant notes
     *
     * @param userQuestion - The user's original question
     * @param llmService - The LLM service to use
     * @param contextNoteId - Optional note ID to restrict search to
     * @returns Object with the built context, the relevant notes, and the generated queries
     */
    async processQuery(userQuestion: string, llmService: any, contextNoteId: string | null = null) {
        if (!this.initialized) {
            await this.initialize();
        }

        // Step 1: Generate search queries
        const searchQueries = await this.generateSearchQueries(userQuestion, llmService);
        log.info(`Generated search queries: ${JSON.stringify(searchQueries)}`);

        // Step 2: Find relevant notes using those queries
        const relevantNotes = await this.findRelevantNotesMultiQuery(
            searchQueries,
            contextNoteId,
            8 // Get more notes since we're using multiple queries
        );

        // Step 3: Build context from the notes
        const context = this.buildContextFromNotes(relevantNotes, userQuestion);

        return {
            context,
            notes: relevantNotes,
            queries: searchQueries
        };
    }
}

export default new TriliumContextService();
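
Below is a minimal usage sketch (not part of the commit) showing how a caller might wire this service into a chat flow. It assumes an llmService object exposing the sendTextCompletion(messages, options) method used above; the wrapper function name and the final completion call are illustrative placeholders rather than existing Trilium APIs.

import triliumContextService from "./trilium_context_service.js";

// Hypothetical wrapper, for illustration only
async function answerWithNoteContext(userQuestion: string, llmService: any, contextNoteId: string | null = null) {
    // Generate search queries, retrieve relevant notes, and format them into a context string
    const { context, notes, queries } = await triliumContextService.processQuery(
        userQuestion,
        llmService,
        contextNoteId
    );

    // Feed the assembled context plus the original question back to the LLM
    const messages = [
        { role: "system", content: context },
        { role: "user", content: userQuestion }
    ];

    // sendTextCompletion mirrors the call used inside generateSearchQueries above
    const answer = await llmService.sendTextCompletion(messages, { temperature: 0.7, maxTokens: 1000 });

    return { answer, notes, queries };
}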