LibreChat/api/app/clients/OllamaClient.js

const { z } = require('zod');
const axios = require('axios');
const { Ollama } = require('ollama');
const { sleep } = require('@librechat/agents');
const { logger } = require('@librechat/data-schemas');
const { Constants } = require('librechat-data-provider');
const { resolveHeaders, deriveBaseURL } = require('@librechat/api');

/** Builds an optional-number validator; used for every numeric tuning field below. */
const optionalNumber = () => z.number().optional();

/**
 * Validation schema for the Ollama-specific fields of a chat payload.
 *
 * Only `model` is required. Every other field is optional, and `seed` may
 * additionally be `null`. Fields not listed here (for example `messages`) are
 * not part of the parsed result, so callers read them from the raw payload.
 */
const ollamaPayloadSchema = z.object({
  mirostat: optionalNumber(),
  mirostat_eta: optionalNumber(),
  mirostat_tau: optionalNumber(),
  num_ctx: optionalNumber(),
  repeat_last_n: optionalNumber(),
  repeat_penalty: optionalNumber(),
  temperature: optionalNumber(),
  seed: z.number().nullable().optional(),
  stop: z.string().array().optional(),
  tfs_z: optionalNumber(),
  num_predict: optionalNumber(),
  top_k: optionalNumber(),
  top_p: optionalNumber(),
  stream: z.boolean().optional(),
  model: z.string(),
});

/**
 * Extracts the Base64 payload from a data URL of the form
 * `<prefix>;base64,<payload>`.
 *
 * The input must contain the `;base64,` separator exactly once. Anything else
 * (including a non-string value) is reported through the logger and yields
 * `undefined`; this function does not throw.
 *
 * @param {string} imageUrl - Data URL expected to embed a Base64 payload.
 * @returns {string | undefined} The text after `;base64,`, or `undefined` when
 *   the input is not a string or does not contain exactly one separator.
 */
const getValidBase64 = (imageUrl) => {
  // Guard non-string input so a malformed message part cannot crash on `.split`.
  const parts = typeof imageUrl === 'string' ? imageUrl.split(';base64,') : [];

  if (parts.length === 2) {
    return parts[1];
  }

  logger.error('Invalid or no Base64 string found in URL.');
  return undefined;
};

/**
 * Wrapper around the `ollama` SDK client that lists models and streams chat
 * completions from OpenAI-style payloads.
 */
class OllamaClient {
  /**
   * @param {Object} [options]
   * @param {string} [options.baseURL] - Ollama server URL; defaults to `http://localhost:11434`.
   * @param {number} [options.streamRate] - Delay passed to `sleep` between streamed tokens;
   *   defaults to `Constants.DEFAULT_STREAM_RATE`.
   * @param {Record<string, string>} [options.headers] - Custom headers; defaults to `{}`.
   */
  constructor(options = {}) {
    const host = deriveBaseURL(options.baseURL ?? 'http://localhost:11434');
    this.streamRate = options.streamRate ?? Constants.DEFAULT_STREAM_RATE;
    // NOTE(review): headers are stored on the instance but not forwarded to the SDK
    // client here — confirm whether chat requests should carry them.
    this.headers = options.headers ?? {};
    /** @type {Ollama} */
    this.client = new Ollama({ host });
  }

  /**
   * Fetches Ollama models from the specified base API path.
   * @param {string} baseURL
   * @param {Object} [options] - Optional configuration
   * @param {Partial<IUser>} [options.user] - User object for header resolution
   * @param {Record<string, string>} [options.headers] - Headers to include in the request
   * @returns {Promise<string[]>} The Ollama model names; an empty array when `baseURL` is falsy.
   * @throws {Error} Throws if the Ollama API request fails
   */
  static async fetchModels(baseURL, options = {}) {
    if (!baseURL) {
      return [];
    }

    const ollamaEndpoint = deriveBaseURL(baseURL);

    const resolvedHeaders = resolveHeaders({
      headers: options.headers,
      user: options.user,
    });

    /** @type {AxiosResponse<OllamaListResponse>} */
    const response = await axios.get(`${ollamaEndpoint}/api/tags`, {
      headers: resolvedHeaders,
      timeout: 5000,
    });

    return response.data.models.map((tag) => tag.name);
  }

  /**
   * Converts OpenAI-style chat messages into Ollama chat messages.
   *
   * String content is passed through unchanged. Array content has its `text`
   * parts joined with single spaces (then trimmed) and its `image_url` parts
   * reduced to their Base64 payloads under `images`. Image parts that do not
   * yield a Base64 payload are skipped so `images` never contains `undefined`.
   *
   * @param {ChatCompletionMessage[]} messages
   * @returns {OllamaMessage[]}
   */
  static formatOpenAIMessages(messages) {
    const ollamaMessages = [];

    for (const message of messages) {
      if (typeof message.content === 'string') {
        ollamaMessages.push({
          role: message.role,
          content: message.content,
        });
        continue;
      }

      // Content that is neither a string nor an array (e.g. null) is treated as empty.
      const parts = Array.isArray(message.content) ? message.content : [];
      const textParts = [];
      const images = [];

      for (const part of parts) {
        if (part.type === 'text') {
          textParts.push(part.text);
        } else if (part.type === 'image_url') {
          const base64 = getValidBase64(part.image_url.url);
          if (base64) {
            images.push(base64);
          }
        }
      }

      const ollamaMessage = {
        role: message.role,
        content: textParts.join(' ').trim(),
      };

      if (images.length > 0) {
        ollamaMessage.images = images;
      }

      ollamaMessages.push(ollamaMessage);
    }

    return ollamaMessages;
  }

  /**
   * Streams a chat completion and returns the accumulated reply text.
   *
   * The payload is validated with `ollamaPayloadSchema`. `model` and `stream`
   * are sent at the top level of the chat request; every other validated field
   * that is not null/undefined is sent inside the request's `options` object.
   * Non-streaming requests are not implemented yet and resolve to `''`.
   *
   * @param {Object} params
   * @param {ChatCompletionPayload} params.payload
   * @param {onTokenProgress} params.onProgress - Called with each streamed token.
   * @param {AbortController | null} [params.abortController] - When its signal is aborted,
   *   streaming stops after the current token and the partial reply is returned.
   * @returns {Promise<string>} The concatenated streamed tokens.
   * @throws {Error} Rethrows validation, request, or streaming errors after logging them.
   */
  async chatCompletion({ payload, onProgress, abortController = null }) {
    try {
      let intermediateReply = '';

      const { model, stream: shouldStream, ...modelOptions } = ollamaPayloadSchema.parse(payload);
      const messages = OllamaClient.formatOpenAIMessages(payload.messages);

      if (!shouldStream) {
        // TODO: regular completion
        return intermediateReply;
      }

      // Model parameters belong under `options`; drop unset values (e.g. `seed: null`).
      const options = Object.fromEntries(
        Object.entries(modelOptions).filter(([, value]) => value !== null && value !== undefined),
      );

      const stream = await this.client.chat({
        model,
        messages,
        stream: shouldStream,
        options,
      });

      for await (const chunk of stream) {
        const token = chunk.message.content;
        intermediateReply += token;
        onProgress(token);

        // `abortController` is optional, so never dereference it unguarded.
        if (abortController?.signal?.aborted) {
          // Prefer the stream's own `abort()`; fall back to a `controller` if one is exposed.
          if (typeof stream.abort === 'function') {
            stream.abort();
          } else {
            stream.controller?.abort();
          }
          break;
        }

        await sleep(this.streamRate);
      }

      return intermediateReply;
    } catch (err) {
      logger.error('[OllamaClient.chatCompletion]', err);
      throw err;
    }
  }
}

module.exports = { OllamaClient, ollamaPayloadSchema };
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`const { z } = require('zod');`
			`const axios = require('axios');`
			`const { Ollama } = require('ollama');`
👁️ feat: Azure Mistral OCR Strategy (#7888) * 👁️ feat: Add Azure Mistral OCR strategy and endpoint integration This commit introduces a new OCR strategy named 'azure_mistral_ocr', allowing the use of a Mistral OCR endpoint deployed on Azure. The configuration, schemas, and file upload strategies have been updated to support this integration, enabling seamless OCR processing via Azure-hosted Mistral services. * 🗑️ chore: Clean up .gitignore by removing commented-out uncommon directory name * chore: remove unused vars * refactor: Move createAxiosInstance to packages/api/utils and update imports - Removed the createAxiosInstance function from the config module and relocated it to a new utils module for better organization. - Updated import paths in relevant files to reflect the new location of createAxiosInstance. - Added tests for createAxiosInstance to ensure proper functionality and proxy configuration handling. * chore: move axios helpers to packages/api - Added logAxiosError function to @librechat/api for centralized error logging. - Updated imports across various files to use the new logAxiosError function. - Removed the old axios.js utility file as it is no longer needed. * chore: Update Jest moduleNameMapper for improved path resolution - Added a new mapping for '~/' to resolve module paths in Jest configuration, enhancing import handling for the project. * feat: Implement Mistral OCR API integration in TS * chore: Update MistralOCR tests based on new imports * fix: Enhance MistralOCR configuration handling and tests - Introduced helper functions for resolving configuration values from environment variables or hardcoded settings. - Updated the uploadMistralOCR and uploadAzureMistralOCR functions to utilize the new configuration resolution logic. - Improved test cases to ensure correct behavior when mixing environment variables and hardcoded values. - Mocked file upload and signed URL responses in tests to validate functionality without external dependencies. 
* feat: Enhance MistralOCR functionality with improved configuration and error handling - Introduced helper functions for loading authentication configuration and resolving values from environment variables. - Updated uploadMistralOCR and uploadAzureMistralOCR functions to utilize the new configuration logic. - Added utility functions for processing OCR results and creating error messages. - Improved document type determination and result aggregation for better OCR processing. * refactor: Reorganize OCR type imports in Mistral CRUD file - Moved OCRResult, OCRResultPage, and OCRImage imports to a more logical grouping for better readability and maintainability. * feat: Add file exports to API and create files index * chore: Update OCR types for enhanced structure and clarity - Redesigned OCRImage interface to include mandatory fields and improved naming conventions. - Added PageDimensions interface for better representation of page metrics. - Updated OCRResultPage to include dimensions and mandatory images array. - Refined OCRResult to include document annotation and usage information. * refactor: use TS counterpart of uploadOCR methods * ci: Update MistralOCR tests to reflect new OCR result structure * chore: Bump version of @librechat/api to 1.2.3 in package.json and package-lock.json * chore: Update CONFIG_VERSION to 1.2.8 * chore: remove unused sendEvent function from config module (now imported from '@librechat/api') * chore: remove MistralOCR service files and tests (now in '@librechat/api') * ci: update logger import in ModelService tests to use @librechat/data-schemas --------- Co-authored-by: arthurolivierfortin <arthurolivier.fortin@gmail.com> 2025-06-13 15:14:57 -04:00			`const { sleep } = require('@librechat/agents');`
			`const { logger } = require('@librechat/data-schemas');`
⚙️ feat: Adjust Rate of Stream Progress (#3244) * chore: bump data-provider and add MESSAGES CacheKey * refactor: avoid saving messages while streaming, save partial text to cache instead * fix(ci): processChunks * chore: logging aborted request to debug * feat: set stream rate for token processing * chore: specify default stream rate * fix(ci): Update AppService.js to use optional chaining for endpointLocals assignment * refactor: abstract the error handler * feat: streamRate for assistants; refactor: update default rate for token * refactor: update error handling in assistants/errors.js * refactor: update error handling in assistants/errors.js 2024-07-17 10:47:17 -04:00			`const { Constants } = require('librechat-data-provider');`
🧵 refactor: Migrate Endpoint Initialization to TypeScript (#10794) * refactor: move endpoint initialization methods to typescript * refactor: move agent init to packages/api - Introduced `initialize.ts` for agent initialization, including file processing and tool loading. - Updated `resources.ts` to allow optional appConfig parameter. - Enhanced endpoint configuration handling in various initialization files to support model parameters. - Added new artifacts and prompts for React component generation. - Refactored existing code to improve type safety and maintainability. * refactor: streamline endpoint initialization and enhance type safety - Updated initialization functions across various endpoints to use a consistent request structure, replacing `unknown` types with `ServerResponse`. - Simplified request handling by directly extracting keys from the request body. - Improved type safety by ensuring user IDs are safely accessed with optional chaining. - Removed unnecessary parameters and streamlined model options handling for better clarity and maintainability. * refactor: moved ModelService and extractBaseURL to packages/api - Added comprehensive tests for the models fetching functionality, covering scenarios for OpenAI, Anthropic, Google, and Ollama models. - Updated existing endpoint index to include the new models module. - Enhanced utility functions for URL extraction and model data processing. - Improved type safety and error handling across the models fetching logic. * refactor: consolidate utility functions and remove unused files - Merged `deriveBaseURL` and `extractBaseURL` into the `@librechat/api` module for better organization. - Removed redundant utility files and their associated tests to streamline the codebase. - Updated imports across various client files to utilize the new consolidated functions. - Enhanced overall maintainability by reducing the number of utility modules. 
* refactor: replace ModelService references with direct imports from @librechat/api and remove ModelService file * refactor: move encrypt/decrypt methods and key db methods to data-schemas, use `getProviderConfig` from `@librechat/api` * chore: remove unused 'res' from options in AgentClient * refactor: file model imports and methods - Updated imports in various controllers and services to use the unified file model from '~/models' instead of '~/models/File'. - Consolidated file-related methods into a new file methods module in the data-schemas package. - Added comprehensive tests for file methods including creation, retrieval, updating, and deletion. - Enhanced the initializeAgent function to accept dependency injection for file-related methods. - Improved error handling and logging in file methods. * refactor: streamline database method references in agent initialization * refactor: enhance file method tests and update type references to IMongoFile * refactor: consolidate database method imports in agent client and initialization * chore: remove redundant import of initializeAgent from @librechat/api * refactor: move checkUserKeyExpiry utility to @librechat/api and update references across endpoints * refactor: move updateUserPlugins logic to user.ts and simplify UserController * refactor: update imports for user key management and remove UserService * refactor: remove unused Anthropics and Bedrock endpoint files and clean up imports * refactor: consolidate and update encryption imports across various files to use @librechat/data-schemas * chore: update file model mock to use unified import from '~/models' * chore: import order * refactor: remove migrated to TS agent.js file and its associated logic from the endpoints * chore: add reusable function to extract imports from source code in unused-packages workflow * chore: enhance unused-packages workflow to include @librechat/api dependencies and improve dependency extraction * chore: improve dependency extraction 
in unused-packages workflow with enhanced error handling and debugging output * chore: add detailed debugging output to unused-packages workflow for better visibility into unused dependencies and exclusion lists * chore: refine subpath handling in unused-packages workflow to correctly process scoped and non-scoped package imports * chore: clean up unused debug output in unused-packages workflow and reorganize type imports in initialize.ts 2025-12-03 17:21:41 -05:00			`const { resolveHeaders, deriveBaseURL } = require('@librechat/api');`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00
			`const ollamaPayloadSchema = z.object({`
			`mirostat: z.number().optional(),`
			`mirostat_eta: z.number().optional(),`
			`mirostat_tau: z.number().optional(),`
			`num_ctx: z.number().optional(),`
			`repeat_last_n: z.number().optional(),`
			`repeat_penalty: z.number().optional(),`
			`temperature: z.number().optional(),`
			`seed: z.number().nullable().optional(),`
			`stop: z.array(z.string()).optional(),`
			`tfs_z: z.number().optional(),`
			`num_predict: z.number().optional(),`
			`top_k: z.number().optional(),`
			`top_p: z.number().optional(),`
			`stream: z.optional(z.boolean()),`
			`model: z.string(),`
			`});`

			`/**`
			`* @param {string} imageUrl`
			`* @returns {string}`
			`* @throws {Error}`
			`*/`
			`const getValidBase64 = (imageUrl) => {`
			`const parts = imageUrl.split(';base64,');`

			`if (parts.length === 2) {`
			`return parts[1];`
			`} else {`
			`logger.error('Invalid or no Base64 string found in URL.');`
			`}`
			`};`

			`class OllamaClient {`
			`constructor(options = {}) {`
			`const host = deriveBaseURL(options.baseURL ?? 'http://localhost:11434');`
⚙️ feat: Adjust Rate of Stream Progress (#3244) * chore: bump data-provider and add MESSAGES CacheKey * refactor: avoid saving messages while streaming, save partial text to cache instead * fix(ci): processChunks * chore: logging aborted request to debug * feat: set stream rate for token processing * chore: specify default stream rate * fix(ci): Update AppService.js to use optional chaining for endpointLocals assignment * refactor: abstract the error handler * feat: streamRate for assistants; refactor: update default rate for token * refactor: update error handling in assistants/errors.js * refactor: update error handling in assistants/errors.js 2024-07-17 10:47:17 -04:00			`this.streamRate = options.streamRate ?? Constants.DEFAULT_STREAM_RATE;`
🦙 fix: Ollama Custom Headers (#10314) * 🦙 fix: Ollama Custom Headers * chore: Correct import order for resolveHeaders in OllamaClient.js * fix: Improve error logging for Ollama API model fetch failure * ci: update Ollama model fetch tests * ci: Add unit test for passing headers and user object to Ollama fetchModels 2025-10-30 14:48:10 -04:00			`this.headers = options.headers ?? {};`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`/** @type {Ollama} */`
			`this.client = new Ollama({ host });`
			`}`

			`/**`
			`* Fetches Ollama models from the specified base API path.`
			`* @param {string} baseURL`
🦙 fix: Ollama Custom Headers (#10314) * 🦙 fix: Ollama Custom Headers * chore: Correct import order for resolveHeaders in OllamaClient.js * fix: Improve error logging for Ollama API model fetch failure * ci: update Ollama model fetch tests * ci: Add unit test for passing headers and user object to Ollama fetchModels 2025-10-30 14:48:10 -04:00			`* @param {Object} [options] - Optional configuration`
			`* @param {Partial<IUser>} [options.user] - User object for header resolution`
			`* @param {Record<string, string>} [options.headers] - Headers to include in the request`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`* @returns {Promise<string[]>} The Ollama models.`
🦙 fix: Ollama Custom Headers (#10314) * 🦙 fix: Ollama Custom Headers * chore: Correct import order for resolveHeaders in OllamaClient.js * fix: Improve error logging for Ollama API model fetch failure * ci: update Ollama model fetch tests * ci: Add unit test for passing headers and user object to Ollama fetchModels 2025-10-30 14:48:10 -04:00			`* @throws {Error} Throws if the Ollama API request fails`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`*/`
🦙 fix: Ollama Custom Headers (#10314) * 🦙 fix: Ollama Custom Headers * chore: Correct import order for resolveHeaders in OllamaClient.js * fix: Improve error logging for Ollama API model fetch failure * ci: update Ollama model fetch tests * ci: Add unit test for passing headers and user object to Ollama fetchModels 2025-10-30 14:48:10 -04:00			`static async fetchModels(baseURL, options = {}) {`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`if (!baseURL) {`
			`return [];`
			`}`
🦙 fix: Ollama Custom Headers (#10314) * 🦙 fix: Ollama Custom Headers * chore: Correct import order for resolveHeaders in OllamaClient.js * fix: Improve error logging for Ollama API model fetch failure * ci: update Ollama model fetch tests * ci: Add unit test for passing headers and user object to Ollama fetchModels 2025-10-30 14:48:10 -04:00
			`const ollamaEndpoint = deriveBaseURL(baseURL);`

			`const resolvedHeaders = resolveHeaders({`
			`headers: options.headers,`
			`user: options.user,`
			`});`

			`/** @type {Promise<AxiosResponse<OllamaListResponse>>} */`
			const response = await axios.get(`${ollamaEndpoint}/api/tags`, {
			`headers: resolvedHeaders,`
			`timeout: 5000,`
			`});`

			`const models = response.data.models.map((tag) => tag.name);`
			`return models;`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`}`

			`/**`
			`* @param {ChatCompletionMessage[]} messages`
			`* @returns {OllamaMessage[]}`
			`*/`
			`static formatOpenAIMessages(messages) {`
			`const ollamaMessages = [];`

			`for (const message of messages) {`
			`if (typeof message.content === 'string') {`
			`ollamaMessages.push({`
			`role: message.role,`
			`content: message.content,`
			`});`
			`continue;`
			`}`

			`let aggregatedText = '';`
			`let imageUrls = [];`

			`for (const content of message.content) {`
			`if (content.type === 'text') {`
			`aggregatedText += content.text + ' ';`
			`} else if (content.type === 'image_url') {`
			`imageUrls.push(getValidBase64(content.image_url.url));`
			`}`
			`}`

			`const ollamaMessage = {`
			`role: message.role,`
			`content: aggregatedText.trim(),`
			`};`

			`if (imageUrls.length > 0) {`
			`ollamaMessage.images = imageUrls;`
			`}`

			`ollamaMessages.push(ollamaMessage);`
			`}`

			`return ollamaMessages;`
			`}`

			`/***`
			`* @param {Object} params`
			`* @param {ChatCompletionPayload} params.payload`
			`* @param {onTokenProgress} params.onProgress`
			`* @param {AbortController} params.abortController`
			`*/`
			`async chatCompletion({ payload, onProgress, abortController = null }) {`
			`let intermediateReply = '';`

			`const parameters = ollamaPayloadSchema.parse(payload);`
			`const messages = OllamaClient.formatOpenAIMessages(payload.messages);`

			`if (parameters.stream) {`
			`const stream = await this.client.chat({`
			`messages,`
			`...parameters,`
			`});`

			`for await (const chunk of stream) {`
			`const token = chunk.message.content;`
			`intermediateReply += token;`
			`onProgress(token);`
			`if (abortController.signal.aborted) {`
			`stream.controller.abort();`
			`break;`
			`}`
⚙️ feat: Adjust Rate of Stream Progress (#3244) * chore: bump data-provider and add MESSAGES CacheKey * refactor: avoid saving messages while streaming, save partial text to cache instead * fix(ci): processChunks * chore: logging aborted request to debug * feat: set stream rate for token processing * chore: specify default stream rate * fix(ci): Update AppService.js to use optional chaining for endpointLocals assignment * refactor: abstract the error handler * feat: streamRate for assistants; refactor: update default rate for token * refactor: update error handling in assistants/errors.js * refactor: update error handling in assistants/errors.js 2024-07-17 10:47:17 -04:00
			`await sleep(this.streamRate);`
🦙 feat: Ollama Vision Support (#2643) * refactor: checkVisionRequest, search availableModels for valid vision model instead of using default * feat: install ollama-js, add typedefs * feat: Ollama Vision Support * ci: fix test 2024-05-08 20:24:40 -04:00			`}`
			`}`
			`// TODO: regular completion`
			`else {`
			`// const generation = await this.client.generate(payload);`
			`}`

			`return intermediateReply;`
			`}`
			`catch(err) {`
			`logger.error('[OllamaClient.chatCompletion]', err);`
			`throw err;`
			`}`
			`}`

			`module.exports = { OllamaClient, ollamaPayloadSchema };`