import axios from "axios";
import log from "../../../log.js";
import { BaseEmbeddingProvider } from "../base_embeddings.js";
import type { EmbeddingConfig, EmbeddingModelInfo } from "../embeddings_interface.js";
import { NormalizationStatus } from "../embeddings_interface.js";
import { LLM_CONSTANTS } from "../../../../routes/api/llm.js";

/**
 * Ollama embedding provider implementation
 */
export class OllamaEmbeddingProvider extends BaseEmbeddingProvider {
    name = "ollama";

    constructor(config: EmbeddingConfig) {
        super(config);
    }

    /**
     * Initialize the provider by detecting model capabilities
     */
    async initialize(): Promise<void> {
        const modelName = this.config.model || "llama3";

        try {
            // Detect model capabilities
            const modelInfo = await this.getModelInfo(modelName);

            // Update the config dimension
            this.config.dimension = modelInfo.dimension;

            log.info(`Ollama model ${modelName} initialized with dimension ${this.config.dimension} and context window ${modelInfo.contextWindow}`);
        } catch (error: any) {
            log.error(`Error initializing Ollama provider: ${error.message}`);
        }
    }

    /**
     * Fetch detailed model information from the Ollama API
     * @param modelName The name of the model to fetch information for
     */
    private async fetchModelCapabilities(modelName: string): Promise<EmbeddingModelInfo | null> {
        try {
            // First try the /api/show endpoint (a POST with the model name in the
            // request body), which has detailed model information
            const showResponse = await axios.post(
                `${this.baseUrl}/api/show`,
                { name: modelName },
                {
                    headers: { "Content-Type": "application/json" },
                    timeout: 10000
                }
            );

            if (showResponse.data && showResponse.data.parameters) {
                const params = showResponse.data.parameters;

                // Extract context length from parameters (different models may use different parameter names)
                const contextWindow = params.context_length ||
                    params.num_ctx ||
                    params.context_window ||
                    (LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS as Record<string, number>).default;

                // Some models may provide embedding dimensions
                const embeddingDimension = params.embedding_length || params.dim || null;

                log.info(`Fetched Ollama model info from API for ${modelName}: context window ${contextWindow}`);

                return {
                    dimension: embeddingDimension || 0, // Detected separately if not provided
                    contextWindow: contextWindow,
                    guaranteesNormalization: false // Ollama models don't guarantee normalized embeddings
                };
            }
        } catch (error: any) {
            log.info(`Could not fetch model info from Ollama show API: ${error.message}. Will try embedding test.`);
            // Fall through to the embedding test in getModelInfo()
        }

        return null;
    }

    /**
     * Get model information, resolved in order: the cache, the Ollama API,
     * a test embedding, and finally hardcoded defaults.
     */
    async getModelInfo(modelName: string): Promise<EmbeddingModelInfo> {
        // Check cache first
        const cached = this.modelInfoCache.get(modelName);
        if (cached) {
            return cached;
        }

        // Try to fetch model capabilities from the API
        const apiModelInfo = await this.fetchModelCapabilities(modelName);

        if (apiModelInfo) {
            // If we have a context window but no embedding dimension, we need to detect the dimension
            if (apiModelInfo.contextWindow && !apiModelInfo.dimension) {
                try {
                    // Detect dimension with a test embedding
                    apiModelInfo.dimension = await this.detectEmbeddingDimension(modelName);
                } catch (error) {
                    // If dimension detection fails, fall back to defaults
                    const baseModelName = modelName.split(':')[0];
                    apiModelInfo.dimension = (LLM_CONSTANTS.OLLAMA_MODEL_DIMENSIONS as Record<string, number>)[baseModelName] ||
                        (LLM_CONSTANTS.OLLAMA_MODEL_DIMENSIONS as Record<string, number>).default;
                }
            }

            // Cache and return the API-provided info
            this.modelInfoCache.set(modelName, apiModelInfo);
            this.config.dimension = apiModelInfo.dimension;
            return apiModelInfo;
        }

        // If the API info fetch fails, fall back to a test embedding
        try {
            const dimension = await this.detectEmbeddingDimension(modelName);
            const baseModelName = modelName.split(':')[0];
            const contextWindow = (LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS as Record<string, number>)[baseModelName] ||
                (LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS as Record<string, number>).default;

            const modelInfo: EmbeddingModelInfo = {
                dimension,
                contextWindow,
                guaranteesNormalization: false // Ollama models don't guarantee normalized embeddings
            };
            this.modelInfoCache.set(modelName, modelInfo);
            this.config.dimension = dimension;

            log.info(`Detected Ollama model ${modelName} with dimension ${dimension} (context: ${contextWindow})`);
            return modelInfo;
        } catch (error: any) {
            log.error(`Error detecting Ollama model capabilities: ${error.message}`);

            // If all detection fails, use defaults based on the model name
            const baseModelName = modelName.split(':')[0];
            const dimension = (LLM_CONSTANTS.OLLAMA_MODEL_DIMENSIONS as Record<string, number>)[baseModelName] ||
                (LLM_CONSTANTS.OLLAMA_MODEL_DIMENSIONS as Record<string, number>).default;
            const contextWindow = (LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS as Record<string, number>)[baseModelName] ||
                (LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS as Record<string, number>).default;

            log.info(`Using default parameters for model ${modelName}: dimension ${dimension}, context ${contextWindow}`);

            const modelInfo: EmbeddingModelInfo = {
                dimension,
                contextWindow,
                guaranteesNormalization: false // Ollama models don't guarantee normalized embeddings
            };
            this.modelInfoCache.set(modelName, modelInfo);
            this.config.dimension = dimension;

            return modelInfo;
        }
    }

    /**
     * Detect embedding dimension by making a test API call
     */
    private async detectEmbeddingDimension(modelName: string): Promise<number> {
        const testResponse = await axios.post(
            `${this.baseUrl}/api/embeddings`,
            {
                model: modelName,
                prompt: "Test"
            },
            {
                headers: { "Content-Type": "application/json" },
                timeout: 10000
            }
        );
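
        // A successful /api/embeddings response has the shape { "embedding": number[] },
        // so the length of that array is the model's embedding dimension
        // (e.g. 768 for nomic-embed-text; an illustrative value, not a guarantee).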
        if (testResponse.data && Array.isArray(testResponse.data.embedding)) {
            return testResponse.data.embedding.length;
        } else {
            throw new Error("Could not detect embedding dimensions");
        }
    }

    /**
     * Get the current embedding dimension
     */
    getDimension(): number {
        return this.config.dimension;
    }

    /**
     * Generate embeddings for a single text
     */
    async generateEmbeddings(text: string): Promise<Float32Array> {
        // Handle empty text
        if (!text.trim()) {
            return new Float32Array(this.config.dimension);
        }

        // Configuration for retries
        const maxRetries = 3;
        let retryCount = 0;
        let lastError: any = null;

        while (retryCount <= maxRetries) {
            try {
                const modelName = this.config.model || "llama3";

                // Ensure we have model info
                const modelInfo = await this.getModelInfo(modelName);

                // Trim text if it might exceed the context window (rough character estimate).
                // This is a simplistic approach; ideally we'd count tokens properly.
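                // For example, under this heuristic a model with an 8192-token
                // context window yields a limit of roughly 32768 characters.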
                const charLimit = modelInfo.contextWindow * 4; // Rough estimate: avg 4 chars per token
                const trimmedText = text.length > charLimit ? text.substring(0, charLimit) : text;

                const response = await axios.post(
                    `${this.baseUrl}/api/embeddings`,
                    {
                        model: modelName,
                        prompt: trimmedText,
                        format: "json"
                    },
                    {
                        headers: {
                            "Content-Type": "application/json"
                        },
                        timeout: 60000 // Increased timeout for larger texts (60 seconds)
                    }
                );

                if (response.data && Array.isArray(response.data.embedding)) {
                    // Success! Return the embedding
                    return new Float32Array(response.data.embedding);
                } else {
                    throw new Error("Unexpected response structure from Ollama API");
                }
            } catch (error: any) {
                lastError = error;

                // Only retry on timeout or connection errors
                const errorMessage = error.response?.data?.error?.message || error.message || "Unknown error";
                const isTimeoutError = errorMessage.includes('timeout') ||
                    errorMessage.includes('socket hang up') ||
                    errorMessage.includes('ECONNREFUSED') ||
                    errorMessage.includes('ECONNRESET');

                if (isTimeoutError && retryCount < maxRetries) {
                    // Exponential backoff with jitter
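                    // With maxRetries = 3 this waits roughly 1-2s, 2-3s, then 4-5s
                    // across the successive attempts, capped at 15 seconds.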
                    const delay = Math.min(Math.pow(2, retryCount) * 1000 + Math.random() * 1000, 15000);
                    log.info(`Ollama embedding timeout, retrying in ${Math.round(delay / 1000)}s (attempt ${retryCount + 1}/${maxRetries})`);
                    await new Promise(resolve => setTimeout(resolve, delay));
                    retryCount++;
                } else {
                    // Non-retryable error or max retries exceeded
                    log.error(`Ollama embedding error: ${errorMessage}`);
                    throw new Error(`Ollama embedding error: ${errorMessage}`);
                }
            }
        }

        // If we get here, we've exceeded our retry limit
        const errorMessage = lastError.response?.data?.error?.message || lastError.message || "Unknown error";
        log.error(`Ollama embedding error after ${maxRetries} retries: ${errorMessage}`);
        throw new Error(`Ollama embedding error after ${maxRetries} retries: ${errorMessage}`);
    }

    /**
     * More specific implementation of batch size error detection for Ollama
     */
    protected isBatchSizeError(error: any): boolean {
        const errorMessage = error?.message || '';
        const ollamaBatchSizeErrorPatterns = [
            'context length', 'token limit', 'out of memory',
            'too large', 'overloaded', 'prompt too long',
            'too many tokens', 'maximum size'
        ];

        return ollamaBatchSizeErrorPatterns.some(pattern =>
            errorMessage.toLowerCase().includes(pattern.toLowerCase())
        );
    }

    /**
     * Generate embeddings for multiple texts
     *
     * Note: the Ollama API doesn't support batch embedding, so we process texts
     * sequentially, but use the adaptive batch processor to handle rate limits and retries.
     */
    async generateBatchEmbeddings(texts: string[]): Promise<Float32Array[]> {
        if (texts.length === 0) {
            return [];
        }

        try {
            return await this.processWithAdaptiveBatch(
                texts,
                async (batch) => {
                    const results: Float32Array[] = [];

                    // For Ollama, we have to process one at a time
                    for (const text of batch) {
                        // Skip empty texts
                        if (!text.trim()) {
                            results.push(new Float32Array(this.config.dimension));
                            continue;
                        }

                        const embedding = await this.generateEmbeddings(text);
                        results.push(embedding);
                    }

                    return results;
                },
                // Wrapped in an arrow function so `this` stays bound correctly
                (error: any) => this.isBatchSizeError(error)
            );
        }
        catch (error: any) {
            const errorMessage = error.message || "Unknown error";
            log.error(`Ollama batch embedding error: ${errorMessage}`);
            throw new Error(`Ollama batch embedding error: ${errorMessage}`);
        }
    }
|
2025-03-18 21:09:19 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Returns the normalization status for Ollama embeddings
|
|
|
|
|
* Ollama embeddings are not guaranteed to be normalized
|
|
|
|
|
*/
|
|
|
|
|
getNormalizationStatus(): NormalizationStatus {
|
|
|
|
|
return NormalizationStatus.NEVER; // Be conservative and always normalize
|
|
|
|
|
}
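
    // Note: reporting NEVER signals downstream consumers to L2-normalize these
    // vectors before cosine-similarity comparisons (an assumption about the base
    // pipeline, which is expected to normalize anything not flagged as normalized).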
}
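
// Usage sketch (hypothetical wiring; in the application the provider is normally
// constructed from stored options by the embedding provider registry, and the
// exact EmbeddingConfig fields below are assumptions):
//
//   const provider = new OllamaEmbeddingProvider({
//       model: "nomic-embed-text",
//       dimension: 0,                       // filled in by initialize()
//       baseUrl: "http://localhost:11434"   // assumed to be part of EmbeddingConfig
//   } as EmbeddingConfig);
//   await provider.initialize();
//   const vector = await provider.generateEmbeddings("example text");
//   const batch = await provider.generateBatchEmbeddings(["first", "second"]);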