
* feat: add GOOGLE_MODELS env var
* feat: add gemini vision support
* refactor(GoogleClient): adjust clientOptions handling depending on model
* fix(logger): fix redact logic and redact errors only
* fix(GoogleClient): do not allow non-multiModal messages when gemini-pro-vision is selected
* refactor(OpenAIClient): use `isVisionModel` client property to avoid calling validateVisionModel multiple times
* refactor: better debug logging by correctly traversing, redacting sensitive info, and logging condensed versions of long values
* refactor(GoogleClient): allow response errors to be thrown/caught above client handling so the user receives a meaningful error message; debug orderedMessages, parentMessageId, and buildMessages result
* refactor(AskController): use model from client.modelOptions.model when saving intermediate messages, which requires the progress callback to be initialized after the client is initialized
* feat(useSSE): revert to previous model if the model was auto-switched by the backend due to message attachments
* docs: update with Google updates and notes about Gemini Pro Vision
* fix: do not initialize Redis without USE_REDIS; increase max listeners to 20
149 lines · 3.7 KiB · JavaScript
const Keyv = require('keyv');
const axios = require('axios');
const HttpsProxyAgent = require('https-proxy-agent');
const { EModelEndpoint, defaultModels } = require('librechat-data-provider');
const { isEnabled } = require('~/server/utils');
const keyvRedis = require('~/cache/keyvRedis');
const { extractBaseURL } = require('~/utils');
const { logger } = require('~/config');

// const { getAzureCredentials, genAzureChatCompletion } = require('~/utils/');

const { openAIApiKey, userProvidedOpenAI } = require('./Config/EndpointService').config;

const modelsCache = isEnabled(process.env.USE_REDIS)
  ? new Keyv({ store: keyvRedis })
  : new Keyv({ namespace: 'models' });

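// Optional env configuration: comma-separated model lists, reverse proxy
// URLs, and the OpenRouter API key.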
const {
  OPENROUTER_API_KEY,
  OPENAI_REVERSE_PROXY,
  CHATGPT_MODELS,
  ANTHROPIC_MODELS,
  GOOGLE_MODELS,
  PROXY,
} = process.env ?? {};

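/**
 * Fetches model IDs from the OpenAI-compatible `/models` endpoint, preferring
 * OpenRouter when OPENROUTER_API_KEY is set. Results are cached per base URL;
 * Azure fetching is currently stubbed out and returns the seed list unchanged.
 */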
const fetchOpenAIModels = async (opts = { azure: false, plugins: false }, _models = []) => {
  let models = _models.slice() ?? [];
  let apiKey = openAIApiKey;
  let basePath = 'https://api.openai.com/v1';
  let reverseProxyUrl = OPENAI_REVERSE_PROXY;
  if (opts.azure) {
    return models;
    // const azure = getAzureCredentials();
    // basePath = (genAzureChatCompletion(azure))
    //   .split('/deployments')[0]
    //   .concat(`/models?api-version=${azure.azureOpenAIApiVersion}`);
    // apiKey = azureOpenAIApiKey;
  } else if (OPENROUTER_API_KEY) {
    reverseProxyUrl = 'https://openrouter.ai/api/v1';
    apiKey = OPENROUTER_API_KEY;
  }

  if (reverseProxyUrl) {
    basePath = extractBaseURL(reverseProxyUrl);
  }

  const cachedModels = await modelsCache.get(basePath);
  if (cachedModels) {
    return cachedModels;
  }

  if (basePath || opts.azure) {
    try {
      const payload = {
        headers: {
          Authorization: `Bearer ${apiKey}`,
        },
      };

      if (PROXY) {
        payload.httpsAgent = new HttpsProxyAgent(PROXY);
      }
      const res = await axios.get(`${basePath}${opts.azure ? '' : '/models'}`, payload);

      models = res.data.data.map((item) => item.id);
      // logger.debug(`Fetched ${models.length} models from ${opts.azure ? 'Azure ' : ''}OpenAI API`);
    } catch (err) {
      logger.error(`Failed to fetch models from ${opts.azure ? 'Azure ' : ''}OpenAI API`, err);
    }
  }

  if (!reverseProxyUrl) {
    const regex = /(text-davinci-003|gpt-)/;
    models = models.filter((model) => regex.test(model));
  }

  await modelsCache.set(basePath, models);
  return models;
};

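/**
 * Resolves the OpenAI model list: an env override (AZURE_OPENAI_MODELS,
 * PLUGIN_MODELS, or OPENAI_MODELS) takes precedence; otherwise the default
 * list is returned for user-provided keys, or fetched from the API.
 */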
const getOpenAIModels = async (opts = { azure: false, plugins: false }) => {
  let models = [
    'gpt-4',
    'gpt-4-0613',
    'gpt-3.5-turbo',
    'gpt-3.5-turbo-16k',
    'gpt-3.5-turbo-0613',
    'gpt-3.5-turbo-0301',
  ];

  if (!opts.plugins) {
    models.push('text-davinci-003');
  }

  let key;
  if (opts.azure) {
    key = 'AZURE_OPENAI_MODELS';
  } else if (opts.plugins) {
    key = 'PLUGIN_MODELS';
  } else {
    key = 'OPENAI_MODELS';
  }

  if (process.env[key]) {
    models = String(process.env[key]).split(',');
    return models;
  }

  if (userProvidedOpenAI && !OPENROUTER_API_KEY) {
    return models;
  }

  return await fetchOpenAIModels(opts, models);
};

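/** ChatGPT browser endpoint models; override with CHATGPT_MODELS. */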
const getChatGPTBrowserModels = () => {
  let models = ['text-davinci-002-render-sha', 'gpt-4'];
  if (CHATGPT_MODELS) {
    models = String(CHATGPT_MODELS).split(',');
  }

  return models;
};

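/** Anthropic (Claude) models; override with ANTHROPIC_MODELS. */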
const getAnthropicModels = () => {
  let models = defaultModels[EModelEndpoint.anthropic];
  if (ANTHROPIC_MODELS) {
    models = String(ANTHROPIC_MODELS).split(',');
  }

  return models;
};

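/** Google models (e.g. Gemini); override with GOOGLE_MODELS. */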
const getGoogleModels = () => {
  let models = defaultModels[EModelEndpoint.google];
  if (GOOGLE_MODELS) {
    models = String(GOOGLE_MODELS).split(',');
  }

  return models;
};

module.exports = {
  getOpenAIModels,
  getChatGPTBrowserModels,
  getAnthropicModels,
  getGoogleModels,
};
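For context, here is a minimal sketch of how these getters might be consumed when assembling per-endpoint model lists at startup. The `loadModelConfig` wrapper and the relative require path are illustrative assumptions, not LibreChat's actual code:

// Hypothetical consumer — names and path are assumptions, not LibreChat code.
const {
  getOpenAIModels,
  getChatGPTBrowserModels,
  getAnthropicModels,
  getGoogleModels,
} = require('./ModelService');

async function loadModelConfig() {
  // getOpenAIModels is async because it may call the /models endpoint;
  // the other getters read env vars / defaults synchronously.
  return {
    openAI: await getOpenAIModels(),
    azureOpenAI: await getOpenAIModels({ azure: true }),
    gptPlugins: await getOpenAIModels({ plugins: true }),
    chatGPTBrowser: getChatGPTBrowserModels(),
    anthropic: getAnthropicModels(),
    google: getGoogleModels(),
  };
}

Note that because fetchOpenAIModels caches per base URL, repeated calls within the cache lifetime hit Redis (or the in-memory Keyv store) rather than the API.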