mirror of
https://github.com/danny-avila/LibreChat.git
synced 2025-12-19 18:00:15 +01:00
* WIP(backend/api): custom endpoint * WIP(frontend/client): custom endpoint * chore: adjust typedefs for configs * refactor: use data-provider for cache keys and rename enums and custom endpoint for better clarity and compatibility * feat: loadYaml utility * refactor: rename back to from and proof-of-concept for creating schemas from user-defined defaults * refactor: remove custom endpoint from default endpointsConfig as it will be exclusively managed by yaml config * refactor(EndpointController): rename variables for clarity * feat: initial load custom config * feat(server/utils): add simple `isUserProvided` helper * chore(types): update TConfig type * refactor: remove custom endpoint handling from model services as will be handled by config, modularize fetching of models * feat: loadCustomConfig, loadConfigEndpoints, loadConfigModels * chore: reorganize server init imports, invoke loadCustomConfig * refactor(loadConfigEndpoints/Models): return each custom endpoint as standalone endpoint * refactor(Endpoint/ModelController): spread config values after default (temporary) * chore(client): fix type issues * WIP: first pass for multiple custom endpoints - add endpointType to Conversation schema - add update zod schemas for both convo/presets to allow non-EModelEndpoint value as endpoint (also using type assertion) - use `endpointType` value as `endpoint` where mapping to type is necessary using this field - use custom defined `endpoint` value and not type for mapping to modelsConfig - misc: add return type to `getDefaultEndpoint` - in `useNewConvo`, add the endpointType if it wasn't already added to conversation - EndpointsMenu: use user-defined endpoint name as Title in menu - TODO: custom icon via custom config, change unknown to robot icon * refactor(parseConvo): pass args as an object and change where used accordingly; chore: comment out 'create schema' code * chore: remove unused availableModels field in TConfig type * refactor(parseCompactConvo): pass args as 
an object and change where used accordingly * feat: chat through custom endpoint * chore(message/convoSchemas): avoid saving empty arrays * fix(BaseClient/saveMessageToDatabase): save endpointType * refactor(ChatRoute): show Spinner if endpointsQuery or modelsQuery are still loading, which is apparent with slow fetching of models/remote config on first serve * fix(useConversation): assign endpointType if it's missing * fix(SaveAsPreset): pass real endpoint and endpointType when saving Preset) * chore: recorganize types order for TConfig, add `iconURL` * feat: custom endpoint icon support: - use UnknownIcon in all icon contexts - add mistral and openrouter as known endpoints, and add their icons - iconURL support * fix(presetSchema): move endpointType to default schema definitions shared between convoSchema and defaults * refactor(Settings/OpenAI): remove legacy `isOpenAI` flag * fix(OpenAIClient): do not invoke abortCompletion on completion error * feat: add responseSender/label support for custom endpoints: - use defaultModelLabel field in endpointOption - add model defaults for custom endpoints in `getResponseSender` - add `useGetSender` hook which uses EndpointsQuery to determine `defaultModelLabel` - include defaultModelLabel from endpointConfig in custom endpoint client options - pass `endpointType` to `getResponseSender` * feat(OpenAIClient): use custom options from config file * refactor: rename `defaultModelLabel` to `modelDisplayLabel` * refactor(data-provider): separate concerns from `schemas` into `parsers`, `config`, and fix imports elsewhere * feat: `iconURL` and extract environment variables from custom endpoint config values * feat: custom config validation via zod schema, rename and move to `./projectRoot/librechat.yaml` * docs: custom config docs and examples * fix(OpenAIClient/mistral): mistral does not allow singular system message, also add `useChatCompletion` flag to use openai-node for title completions * fix(custom/initializeClient): extract 
env var and use `isUserProvided` function * Update librechat.example.yaml * feat(InputWithLabel): add className props, and forwardRef * fix(streamResponse): handle error edge case where either messages or convos query throws an error * fix(useSSE): handle errorHandler edge cases where error response is and is not properly formatted from API, especially when a conversationId is not yet provided, which ensures stream is properly closed on error * feat: user_provided keys for custom endpoints * fix(config/endpointSchema): do not allow default endpoint values in custom endpoint `name` * feat(loadConfigModels): extract env variables and optimize fetching models * feat: support custom endpoint iconURL for messages and Nav * feat(OpenAIClient): add/dropParams support * docs: update docs with default params, add/dropParams, and notes to use config file instead of `OPENAI_REVERSE_PROXY` * docs: update docs with additional notes * feat(maxTokensMap): add mistral models (32k context) * docs: update openrouter notes * Update ai_setup.md * docs(custom_config): add table of contents and fix note about custom name * docs(custom_config): reorder ToC * Update custom_config.md * Add note about `max_tokens` field in custom_config.md
176 lines
4.5 KiB
JavaScript
176 lines
4.5 KiB
JavaScript
const Keyv = require('keyv');
|
|
const axios = require('axios');
|
|
const HttpsProxyAgent = require('https-proxy-agent');
|
|
const { EModelEndpoint, defaultModels } = require('librechat-data-provider');
|
|
const { isEnabled } = require('~/server/utils');
|
|
const keyvRedis = require('~/cache/keyvRedis');
|
|
const { extractBaseURL } = require('~/utils');
|
|
const { logger } = require('~/config');
|
|
|
|
// const { getAzureCredentials, genAzureChatCompletion } = require('~/utils/');
|
|
|
|
const { openAIApiKey, userProvidedOpenAI } = require('./Config/EndpointService').config;
|
|
|
|
// Cache of fetched model lists. When USE_REDIS is enabled the shared Redis-backed
// store is used; otherwise a Keyv instance under the `models` namespace is created.
const modelsCache = new Keyv(
  isEnabled(process.env.USE_REDIS) ? { store: keyvRedis } : { namespace: 'models' },
);
|
|
|
|
// Environment-driven settings, read once when this module is loaded.
const {
  // When set, OpenRouter is used as the OpenAI reverse proxy and this is the API key.
  OPENROUTER_API_KEY,
  // Optional reverse proxy URL used in place of the default OpenAI base URL.
  OPENAI_REVERSE_PROXY,
  // Comma-separated model overrides for the respective endpoints.
  CHATGPT_MODELS,
  ANTHROPIC_MODELS,
  GOOGLE_MODELS,
  // Optional proxy URL used to build the HTTPS agent for outgoing model requests.
  PROXY,
} = process.env ?? {};
|
|
|
|
/**
 * Fetches model identifiers from an OpenAI-compatible API, or from Azure.
 *
 * For non-Azure requests, `/models` is appended to `baseURL`; trailing slashes on
 * `baseURL` are stripped first so the resulting path never contains `//models`.
 * For Azure requests, `baseURL` is requested as-is.
 *
 * Failures (request errors, unexpected response shape, proxy agent construction errors)
 * are logged and produce an empty array; this function does not throw for them.
 *
 * @param {Object} params - The parameters for fetching the models.
 * @param {string} [params.apiKey] - The API key, sent as a Bearer token. The Authorization
 *   header is omitted when no key is provided.
 * @param {string} params.baseURL - The base path URL for the API. When missing, no request
 *   is made and an empty array is returned.
 * @param {string} [params.name='OpenAI'] - The name of the API, used in the error log message.
 * @param {boolean} [params.azure=false] - Whether to fetch models from Azure.
 * @returns {Promise<string[]>} A promise that resolves to an array of model identifiers.
 * @async
 */
const fetchModels = async ({ apiKey, baseURL, name = 'OpenAI', azure = false }) => {
  // Without a URL there is nothing to query. This also covers Azure, which would
  // otherwise end up requesting the literal string "undefined".
  if (!baseURL) {
    return [];
  }

  try {
    const options = { headers: {} };

    // Avoid sending a meaningless `Bearer undefined` header when no key is available.
    if (apiKey) {
      options.headers.Authorization = `Bearer ${apiKey}`;
    }

    if (PROXY) {
      options.httpsAgent = new HttpsProxyAgent(PROXY);
    }

    const url = azure ? `${baseURL}` : `${String(baseURL).replace(/\/+$/, '')}/models`;
    const res = await axios.get(url, options);
    return res.data.data.map((item) => item.id);
  } catch (err) {
    logger.error(`Failed to fetch models from ${azure ? 'Azure ' : ''}${name} API`, err);
    return [];
  }
};
|
|
|
|
/**
 * Resolves the OpenAI model list by querying the API (or the configured reverse proxy /
 * OpenRouter), using `modelsCache` keyed by the resolved base URL.
 *
 * The provided default models are returned, and nothing is cached, when:
 * - `opts.azure` is set (fetching models from Azure is not implemented here),
 * - no base URL could be resolved, or
 * - the fetch produced no usable models (e.g. the request failed).
 *
 * Not caching an empty result matters: an empty array is truthy, so once cached it would
 * be served on every later call and the model list would stay empty.
 *
 * When no reverse proxy is in use, the fetched list is narrowed to identifiers matching
 * `text-davinci-003` or `gpt-`.
 *
 * @param {Object} [opts] - Options for fetching the models.
 * @param {boolean} [opts.azure=false] - Whether the models are requested for Azure.
 * @param {boolean} [opts.plugins=false] - Whether the models are requested for plugins
 *   (not read by this function).
 * @param {string[]} [_models=[]] - Default models to fall back to; never mutated.
 * @returns {Promise<string[]>} A promise that resolves to an array of model identifiers.
 * @async
 */
const fetchOpenAIModels = async (opts = { azure: false, plugins: false }, _models = []) => {
  const fallbackModels = [...(_models ?? [])];

  // Fetching the model list from Azure is not supported; use the provided defaults.
  if (opts.azure) {
    return fallbackModels;
  }

  let apiKey = openAIApiKey;
  let reverseProxyUrl = OPENAI_REVERSE_PROXY;
  if (OPENROUTER_API_KEY) {
    // OpenRouter takes precedence over any configured reverse proxy.
    reverseProxyUrl = 'https://openrouter.ai/api/v1';
    apiKey = OPENROUTER_API_KEY;
  }

  const baseURL = reverseProxyUrl ? extractBaseURL(reverseProxyUrl) : 'https://api.openai.com/v1';
  if (!baseURL) {
    return fallbackModels;
  }

  // Ignore empty cached lists so a previously stored failure cannot stick.
  const cachedModels = await modelsCache.get(baseURL);
  if (Array.isArray(cachedModels) ? cachedModels.length > 0 : cachedModels) {
    return cachedModels;
  }

  let models = await fetchModels({
    apiKey,
    baseURL,
    azure: opts.azure,
  });

  if (!reverseProxyUrl) {
    const regex = /(text-davinci-003|gpt-)/;
    models = models.filter((model) => regex.test(model));
  }

  // A failed/empty fetch must not replace the defaults, nor be cached.
  if (models.length === 0) {
    return fallbackModels;
  }

  await modelsCache.set(baseURL, models);
  return models;
};
|
|
|
|
/**
 * Returns the models available for the OpenAI, Azure OpenAI, or plugins endpoint.
 *
 * Resolution order:
 * 1. A comma-separated override from the environment (`AZURE_OPENAI_MODELS`,
 *    `PLUGIN_MODELS` or `OPENAI_MODELS`, depending on `opts`). Entries are trimmed and
 *    empty entries are dropped, so values such as `"gpt-4, gpt-3.5-turbo,"` parse cleanly.
 *    An override that contains no usable entries is ignored.
 * 2. The built-in defaults, when the OpenAI key is user-provided and OpenRouter is not
 *    configured.
 * 3. Otherwise, the result of `fetchOpenAIModels`, which receives the defaults.
 *
 * @param {Object} [opts] - Options selecting which endpoint the models are for.
 * @param {boolean} [opts.azure=false] - Whether the models are for Azure OpenAI.
 * @param {boolean} [opts.plugins=false] - Whether the models are for the plugins endpoint;
 *   when set, `text-davinci-003` is left out of the defaults.
 * @returns {Promise<string[]>} A promise that resolves to an array of model identifiers.
 * @async
 */
const getOpenAIModels = async (opts = { azure: false, plugins: false }) => {
  let key = 'OPENAI_MODELS';
  if (opts.azure) {
    key = 'AZURE_OPENAI_MODELS';
  } else if (opts.plugins) {
    key = 'PLUGIN_MODELS';
  }

  const override = process.env[key];
  if (override) {
    const configuredModels = String(override)
      .split(',')
      .map((model) => model.trim())
      .filter(Boolean);

    if (configuredModels.length > 0) {
      return configuredModels;
    }
  }

  const models = [
    'gpt-4',
    'gpt-4-0613',
    'gpt-3.5-turbo',
    'gpt-3.5-turbo-16k',
    'gpt-3.5-turbo-0613',
    'gpt-3.5-turbo-0301',
  ];

  if (!opts.plugins) {
    models.push('text-davinci-003');
  }

  // With a user-provided key and no OpenRouter key, use the defaults instead of fetching.
  if (userProvidedOpenAI && !OPENROUTER_API_KEY) {
    return models;
  }

  return await fetchOpenAIModels(opts, models);
};
|
|
|
|
/**
 * Returns the models for the ChatGPT Browser endpoint.
 *
 * Uses the comma-separated `CHATGPT_MODELS` value when it is set; entries are trimmed and
 * empty entries are dropped. Falls back to the built-in defaults when the value is unset
 * or contains no usable entries.
 *
 * @returns {string[]} An array of model identifiers.
 */
const getChatGPTBrowserModels = () => {
  const defaults = ['text-davinci-002-render-sha', 'gpt-4'];
  if (!CHATGPT_MODELS) {
    return defaults;
  }

  const configuredModels = String(CHATGPT_MODELS)
    .split(',')
    .map((model) => model.trim())
    .filter(Boolean);

  return configuredModels.length > 0 ? configuredModels : defaults;
};
|
|
|
|
/**
 * Returns the models for the Anthropic endpoint.
 *
 * Uses the comma-separated `ANTHROPIC_MODELS` value when it is set; entries are trimmed
 * and empty entries are dropped. Falls back to the data-provider defaults for the
 * Anthropic endpoint when the value is unset or contains no usable entries.
 *
 * @returns {string[]} An array of model identifiers.
 */
const getAnthropicModels = () => {
  const defaults = defaultModels[EModelEndpoint.anthropic];
  if (!ANTHROPIC_MODELS) {
    return defaults;
  }

  const configuredModels = String(ANTHROPIC_MODELS)
    .split(',')
    .map((model) => model.trim())
    .filter(Boolean);

  return configuredModels.length > 0 ? configuredModels : defaults;
};
|
|
|
|
/**
 * Returns the models for the Google endpoint.
 *
 * Uses the comma-separated `GOOGLE_MODELS` value when it is set; entries are trimmed and
 * empty entries are dropped. Falls back to the data-provider defaults for the Google
 * endpoint when the value is unset or contains no usable entries.
 *
 * @returns {string[]} An array of model identifiers.
 */
const getGoogleModels = () => {
  const defaults = defaultModels[EModelEndpoint.google];
  if (!GOOGLE_MODELS) {
    return defaults;
  }

  const configuredModels = String(GOOGLE_MODELS)
    .split(',')
    .map((model) => model.trim())
    .filter(Boolean);

  return configuredModels.length > 0 ? configuredModels : defaults;
};
|
|
|
|
module.exports = {
|
|
fetchModels,
|
|
getOpenAIModels,
|
|
getChatGPTBrowserModels,
|
|
getAnthropicModels,
|
|
getGoogleModels,
|
|
};
|