mirror of
https://github.com/danny-avila/LibreChat.git
synced 2025-09-22 06:00:56 +02:00

* refactor: use keyv for search caching with 1 min expirations * feat: keyvRedis; chore: bump keyv, bun.lockb, add jsconfig for vscode file resolution * feat: api/search redis support * refactor(redis) use ioredis cluster for keyv fix(OpenID): when redis is configured, use redis memory store for express-session * fix: revert using uri for keyvredis * fix(SearchBar): properly debounce search queries, fix weird render behaviors * refactor: add authentication to search endpoint and show error messages in results * feat: redis support for violation logs * fix(logViolation): ensure a number is always being stored in cache * feat(concurrentLimiter): uses clearPendingReq, clears pendingReq on abort, redis support * fix(api/search/enable): query only when authenticated * feat(ModelService): redis support * feat(checkBan): redis support * refactor(api/search): consolidate keyv logic * fix(ci): add default empty value for REDIS_URI * refactor(keyvRedis): use condition to initialize keyvRedis assignment * refactor(connectDb): handle disconnected state (should create a new conn) * fix(ci/e2e): handle case where cleanUp did not successfully run * fix(getDefaultEndpoint): return endpoint from localStorage if defined and endpointsConfig is default * ci(e2e): remove afterAll messages as startup/cleanUp will clear messages * ci(e2e): remove teardown for CI until further notice * chore: bump playwright/test * ci(e2e): reinstate teardown as CI issue is specific to github env * fix(ci): click settings menu trigger by testid
130 lines
3.2 KiB
JavaScript
130 lines
3.2 KiB
JavaScript
const Keyv = require('keyv');
|
|
const axios = require('axios');
|
|
const { isEnabled } = require('../utils');
|
|
const keyvRedis = require('../../cache/keyvRedis');
|
|
// const { getAzureCredentials, genAzureChatCompletion } = require('../../utils/');
|
|
const { openAIApiKey, userProvidedOpenAI } = require('./EndpointService').config;
|
|
|
|
// Cache used for fetched model lists: the shared keyvRedis store when USE_REDIS is enabled,
// otherwise a default Keyv instance namespaced as 'models'.
const modelsCache = new Keyv(
  isEnabled(process.env.USE_REDIS) ? { store: keyvRedis } : { namespace: 'models' },
);

// Environment settings read once at module load and shared by the functions below.
const {
  OPENROUTER_API_KEY,
  OPENAI_REVERSE_PROXY,
  CHATGPT_MODELS,
  ANTHROPIC_MODELS,
} = process.env ?? {};
|
|
|
|
/**
 * Fetches the ids of the available models from an OpenAI-compatible `/models` endpoint and
 * caches the resulting list in `modelsCache`, keyed by the resolved base path.
 *
 * Base path resolution:
 *  - defaults to `https://api.openai.com/v1`;
 *  - when `OPENROUTER_API_KEY` is set, OpenRouter's API URL is used as the reverse proxy;
 *  - otherwise `OPENAI_REVERSE_PROXY` is used when set.
 * Only the part of the reverse proxy URL up to and including its last `v1` is kept.
 *
 * @param {{ azure?: boolean, plugins?: boolean }} [opts] - Request flags. When `azure` is truthy
 *   nothing is fetched and a copy of `_models` is returned.
 * @param {string[]} [_models] - Fallback model ids, used when the list cannot be fetched.
 * @returns {Promise<string[]>} The cached list if present, otherwise the fetched (or fallback)
 *   list. Without a reverse proxy the list is narrowed to `text-davinci-003` and `gpt-*` ids.
 */
const fetchOpenAIModels = async (opts = { azure: false, plugins: false }, _models = []) => {
  // Copy the fallback list so the array handed back is never the caller's own instance.
  let models = [...(_models ?? [])];

  // Fetching the model list for Azure is not implemented; return the fallback list as-is.
  if (opts?.azure) {
    return models;
  }

  // OpenRouter takes precedence over a user-configured reverse proxy.
  const reverseProxyUrl = OPENROUTER_API_KEY
    ? 'https://openrouter.ai/api/v1'
    : OPENAI_REVERSE_PROXY;

  let basePath = 'https://api.openai.com/v1';
  if (reverseProxyUrl) {
    basePath = reverseProxyUrl.match(/.*v1/)?.[0];
    if (!basePath) {
      // The proxy URL has no `v1` segment, so neither the models endpoint nor a cache key can
      // be derived from it. Fall back to the provided list instead of throwing on `undefined`.
      return models;
    }
  }

  const cachedModels = await modelsCache.get(basePath);
  if (cachedModels) {
    return cachedModels;
  }

  try {
    const res = await axios.get(`${basePath}/models`, {
      headers: {
        Authorization: `Bearer ${openAIApiKey}`,
      },
    });

    models = res.data.data.map((item) => item.id);
  } catch (err) {
    // Best effort: keep the fallback list, but surface why the request failed.
    console.log(`Failed to fetch models from OpenAI API: ${err?.message ?? err}`);
  }

  // Without a reverse proxy, keep only the ids matching the pattern below.
  if (!reverseProxyUrl) {
    const regex = /(text-davinci-003|gpt-)/;
    models = models.filter((model) => regex.test(model));
  }

  await modelsCache.set(basePath, models);
  return models;
};
|
|
|
|
/**
 * Resolves the model ids to offer for the OpenAI, Azure OpenAI or plugins endpoint.
 *
 * Resolution order:
 *  1. A comma-separated environment override (`AZURE_OPENAI_MODELS`, `PLUGIN_MODELS` or
 *     `OPENAI_MODELS`, chosen from `opts`) is returned as-is when set.
 *  2. The built-in defaults are returned when `userProvidedOpenAI` is truthy and
 *     `OPENROUTER_API_KEY` is not set.
 *  3. Otherwise the list is obtained through `fetchOpenAIModels`, with the defaults as fallback.
 *
 * @param {{ azure?: boolean, plugins?: boolean }} [opts] - Selects which endpoint the list is for.
 * @returns {Promise<string[]>} The resolved model ids.
 */
const getOpenAIModels = async (opts = { azure: false, plugins: false }) => {
  // `text-davinci-003` is only part of the defaults outside the plugins endpoint.
  const defaultModels = [
    'gpt-4',
    'gpt-4-0613',
    'gpt-3.5-turbo',
    'gpt-3.5-turbo-16k',
    'gpt-3.5-turbo-0613',
    'gpt-3.5-turbo-0301',
    ...(opts.plugins ? [] : ['text-davinci-003']),
  ];

  // Azure wins over plugins when both flags are set.
  let envKey = 'OPENAI_MODELS';
  if (opts.azure) {
    envKey = 'AZURE_OPENAI_MODELS';
  } else if (opts.plugins) {
    envKey = 'PLUGIN_MODELS';
  }

  const override = process.env[envKey];
  if (override) {
    return String(override).split(',');
  }

  const skipFetch = userProvidedOpenAI && !OPENROUTER_API_KEY;
  if (skipFetch) {
    return defaultModels;
  }

  return await fetchOpenAIModels(opts, defaultModels);
};
|
|
|
|
/**
 * Lists the model ids for the ChatGPT browser endpoint.
 *
 * @returns {string[]} The comma-separated `CHATGPT_MODELS` environment value split into ids when
 *   it is set, otherwise the built-in defaults.
 */
const getChatGPTBrowserModels = () => {
  if (CHATGPT_MODELS) {
    return String(CHATGPT_MODELS).split(',');
  }

  return ['text-davinci-002-render-sha', 'gpt-4'];
};
|
|
|
|
/**
 * Lists the model ids for the Anthropic endpoint.
 *
 * @returns {string[]} The comma-separated `ANTHROPIC_MODELS` environment value split into ids
 *   when it is set, otherwise the built-in defaults.
 */
const getAnthropicModels = () => {
  if (ANTHROPIC_MODELS) {
    return String(ANTHROPIC_MODELS).split(',');
  }

  return ['claude-1', 'claude-1-100k', 'claude-instant-1', 'claude-instant-1-100k', 'claude-2'];
};
|
|
|
|
// Public API of this module: one model-list getter per supported endpoint family.
module.exports = { getOpenAIModels, getChatGPTBrowserModels, getAnthropicModels };
|