mirror of
https://github.com/danny-avila/LibreChat.git
synced 2025-12-16 16:30:15 +01:00
* refactor: move endpoint initialization methods to typescript * refactor: move agent init to packages/api - Introduced `initialize.ts` for agent initialization, including file processing and tool loading. - Updated `resources.ts` to allow optional appConfig parameter. - Enhanced endpoint configuration handling in various initialization files to support model parameters. - Added new artifacts and prompts for React component generation. - Refactored existing code to improve type safety and maintainability. * refactor: streamline endpoint initialization and enhance type safety - Updated initialization functions across various endpoints to use a consistent request structure, replacing `unknown` types with `ServerResponse`. - Simplified request handling by directly extracting keys from the request body. - Improved type safety by ensuring user IDs are safely accessed with optional chaining. - Removed unnecessary parameters and streamlined model options handling for better clarity and maintainability. * refactor: moved ModelService and extractBaseURL to packages/api - Added comprehensive tests for the models fetching functionality, covering scenarios for OpenAI, Anthropic, Google, and Ollama models. - Updated existing endpoint index to include the new models module. - Enhanced utility functions for URL extraction and model data processing. - Improved type safety and error handling across the models fetching logic. * refactor: consolidate utility functions and remove unused files - Merged `deriveBaseURL` and `extractBaseURL` into the `@librechat/api` module for better organization. - Removed redundant utility files and their associated tests to streamline the codebase. - Updated imports across various client files to utilize the new consolidated functions. - Enhanced overall maintainability by reducing the number of utility modules. * refactor: replace ModelService references with direct imports from @librechat/api and remove ModelService file * refactor: move encrypt/decrypt methods and key db methods to data-schemas, use `getProviderConfig` from `@librechat/api` * chore: remove unused 'res' from options in AgentClient * refactor: file model imports and methods - Updated imports in various controllers and services to use the unified file model from '~/models' instead of '~/models/File'. - Consolidated file-related methods into a new file methods module in the data-schemas package. - Added comprehensive tests for file methods including creation, retrieval, updating, and deletion. - Enhanced the initializeAgent function to accept dependency injection for file-related methods. - Improved error handling and logging in file methods. * refactor: streamline database method references in agent initialization * refactor: enhance file method tests and update type references to IMongoFile * refactor: consolidate database method imports in agent client and initialization * chore: remove redundant import of initializeAgent from @librechat/api * refactor: move checkUserKeyExpiry utility to @librechat/api and update references across endpoints * refactor: move updateUserPlugins logic to user.ts and simplify UserController * refactor: update imports for user key management and remove UserService * refactor: remove unused Anthropics and Bedrock endpoint files and clean up imports * refactor: consolidate and update encryption imports across various files to use @librechat/data-schemas * chore: update file model mock to use unified import from '~/models' * chore: import order * refactor: remove migrated to TS agent.js file and its associated logic from the endpoints * chore: add reusable function to extract imports from source code in unused-packages workflow * chore: enhance unused-packages workflow to include @librechat/api dependencies and improve dependency extraction * chore: improve dependency extraction in unused-packages workflow with enhanced error handling and debugging output * chore: add detailed debugging output to unused-packages workflow for better visibility into unused dependencies and exclusion lists * chore: refine subpath handling in unused-packages workflow to correctly process scoped and non-scoped package imports * chore: clean up unused debug output in unused-packages workflow and reorganize type imports in initialize.ts
411 lines
13 KiB
JavaScript
411 lines
13 KiB
JavaScript
const axios = require('axios');
|
|
const { v4 } = require('uuid');
|
|
const OpenAI = require('openai');
|
|
const FormData = require('form-data');
|
|
const { ProxyAgent } = require('undici');
|
|
const { tool } = require('@langchain/core/tools');
|
|
const { logger } = require('@librechat/data-schemas');
|
|
const { HttpsProxyAgent } = require('https-proxy-agent');
|
|
const { ContentTypes, EImageOutputType } = require('librechat-data-provider');
|
|
const { logAxiosError, oaiToolkit, extractBaseURL } = require('@librechat/api');
|
|
const { getStrategyFunctions } = require('~/server/services/Files/strategies');
|
|
const { getFiles } = require('~/models');
|
|
|
|
const displayMessage =
|
|
"The tool displayed an image. All generated images are already plainly visible, so don't repeat the descriptions in detail. Do not list download links as they are available in the UI already. The user may download the images by clicking on them, but do not mention anything about downloading to the user.";
|
|
|
|
/**
|
|
* Replaces unwanted characters from the input string
|
|
* @param {string} inputString - The input string to process
|
|
* @returns {string} - The processed string
|
|
*/
|
|
function replaceUnwantedChars(inputString) {
|
|
return inputString
|
|
.replace(/\r\n|\r|\n/g, ' ')
|
|
.replace(/"/g, '')
|
|
.trim();
|
|
}
|
|
|
|
function returnValue(value) {
|
|
if (typeof value === 'string') {
|
|
return [value, {}];
|
|
} else if (typeof value === 'object') {
|
|
if (Array.isArray(value)) {
|
|
return value;
|
|
}
|
|
return [displayMessage, value];
|
|
}
|
|
return value;
|
|
}
|
|
|
|
function createAbortHandler() {
|
|
return function () {
|
|
logger.debug('[ImageGenOAI] Image generation aborted');
|
|
};
|
|
}
|
|
|
|
/**
|
|
* Creates OpenAI Image tools (generation and editing)
|
|
* @param {Object} fields - Configuration fields
|
|
* @param {ServerRequest} fields.req - Whether the tool is being used in an agent context
|
|
* @param {boolean} fields.isAgent - Whether the tool is being used in an agent context
|
|
* @param {string} fields.IMAGE_GEN_OAI_API_KEY - The OpenAI API key
|
|
* @param {boolean} [fields.override] - Whether to override the API key check, necessary for app initialization
|
|
* @param {MongoFile[]} [fields.imageFiles] - The images to be used for editing
|
|
* @param {string} [fields.imageOutputType] - The image output type configuration
|
|
* @param {string} [fields.fileStrategy] - The file storage strategy
|
|
* @returns {Array<ReturnType<tool>>} - Array of image tools
|
|
*/
|
|
function createOpenAIImageTools(fields = {}) {
|
|
/** @type {boolean} Used to initialize the Tool without necessary variables. */
|
|
const override = fields.override ?? false;
|
|
/** @type {boolean} */
|
|
if (!override && !fields.isAgent) {
|
|
throw new Error('This tool is only available for agents.');
|
|
}
|
|
const { req } = fields;
|
|
const imageOutputType = fields.imageOutputType || EImageOutputType.PNG;
|
|
const appFileStrategy = fields.fileStrategy;
|
|
|
|
const getApiKey = () => {
|
|
const apiKey = process.env.IMAGE_GEN_OAI_API_KEY ?? '';
|
|
if (!apiKey && !override) {
|
|
throw new Error('Missing IMAGE_GEN_OAI_API_KEY environment variable.');
|
|
}
|
|
return apiKey;
|
|
};
|
|
|
|
let apiKey = fields.IMAGE_GEN_OAI_API_KEY ?? getApiKey();
|
|
const closureConfig = { apiKey };
|
|
|
|
let baseURL = 'https://api.openai.com/v1/';
|
|
if (!override && process.env.IMAGE_GEN_OAI_BASEURL) {
|
|
baseURL = extractBaseURL(process.env.IMAGE_GEN_OAI_BASEURL);
|
|
closureConfig.baseURL = baseURL;
|
|
}
|
|
|
|
// Note: Azure may not yet support the latest image generation models
|
|
if (
|
|
!override &&
|
|
process.env.IMAGE_GEN_OAI_AZURE_API_VERSION &&
|
|
process.env.IMAGE_GEN_OAI_BASEURL
|
|
) {
|
|
baseURL = process.env.IMAGE_GEN_OAI_BASEURL;
|
|
closureConfig.baseURL = baseURL;
|
|
closureConfig.defaultQuery = { 'api-version': process.env.IMAGE_GEN_OAI_AZURE_API_VERSION };
|
|
closureConfig.defaultHeaders = {
|
|
'api-key': process.env.IMAGE_GEN_OAI_API_KEY,
|
|
'Content-Type': 'application/json',
|
|
};
|
|
closureConfig.apiKey = process.env.IMAGE_GEN_OAI_API_KEY;
|
|
}
|
|
|
|
const imageFiles = fields.imageFiles ?? [];
|
|
|
|
/**
|
|
* Image Generation Tool
|
|
*/
|
|
const imageGenTool = tool(
|
|
async (
|
|
{
|
|
prompt,
|
|
background = 'auto',
|
|
n = 1,
|
|
output_compression = 100,
|
|
quality = 'auto',
|
|
size = 'auto',
|
|
},
|
|
runnableConfig,
|
|
) => {
|
|
if (!prompt) {
|
|
throw new Error('Missing required field: prompt');
|
|
}
|
|
const clientConfig = { ...closureConfig };
|
|
if (process.env.PROXY) {
|
|
const proxyAgent = new ProxyAgent(process.env.PROXY);
|
|
clientConfig.fetchOptions = {
|
|
dispatcher: proxyAgent,
|
|
};
|
|
}
|
|
|
|
/** @type {OpenAI} */
|
|
const openai = new OpenAI(clientConfig);
|
|
let output_format = imageOutputType;
|
|
if (
|
|
background === 'transparent' &&
|
|
output_format !== EImageOutputType.PNG &&
|
|
output_format !== EImageOutputType.WEBP
|
|
) {
|
|
logger.warn(
|
|
'[ImageGenOAI] Transparent background requires PNG or WebP format, defaulting to PNG',
|
|
);
|
|
output_format = EImageOutputType.PNG;
|
|
}
|
|
|
|
let resp;
|
|
/** @type {AbortSignal} */
|
|
let derivedSignal = null;
|
|
/** @type {() => void} */
|
|
let abortHandler = null;
|
|
|
|
try {
|
|
if (runnableConfig?.signal) {
|
|
derivedSignal = AbortSignal.any([runnableConfig.signal]);
|
|
abortHandler = createAbortHandler();
|
|
derivedSignal.addEventListener('abort', abortHandler, { once: true });
|
|
}
|
|
|
|
resp = await openai.images.generate(
|
|
{
|
|
model: 'gpt-image-1',
|
|
prompt: replaceUnwantedChars(prompt),
|
|
n: Math.min(Math.max(1, n), 10),
|
|
background,
|
|
output_format,
|
|
output_compression:
|
|
output_format === EImageOutputType.WEBP || output_format === EImageOutputType.JPEG
|
|
? output_compression
|
|
: undefined,
|
|
quality,
|
|
size,
|
|
},
|
|
{
|
|
signal: derivedSignal,
|
|
},
|
|
);
|
|
} catch (error) {
|
|
const message = '[image_gen_oai] Problem generating the image:';
|
|
logAxiosError({ error, message });
|
|
return returnValue(`Something went wrong when trying to generate the image. The OpenAI API may be unavailable:
|
|
Error Message: ${error.message}`);
|
|
} finally {
|
|
if (abortHandler && derivedSignal) {
|
|
derivedSignal.removeEventListener('abort', abortHandler);
|
|
}
|
|
}
|
|
|
|
if (!resp) {
|
|
return returnValue(
|
|
'Something went wrong when trying to generate the image. The OpenAI API may be unavailable',
|
|
);
|
|
}
|
|
|
|
// For gpt-image-1, the response contains base64-encoded images
|
|
// TODO: handle cost in `resp.usage`
|
|
const base64Image = resp.data[0].b64_json;
|
|
|
|
if (!base64Image) {
|
|
return returnValue(
|
|
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.',
|
|
);
|
|
}
|
|
|
|
const content = [
|
|
{
|
|
type: ContentTypes.IMAGE_URL,
|
|
image_url: {
|
|
url: `data:image/${output_format};base64,${base64Image}`,
|
|
},
|
|
},
|
|
];
|
|
|
|
const file_ids = [v4()];
|
|
const response = [
|
|
{
|
|
type: ContentTypes.TEXT,
|
|
text: displayMessage + `\n\ngenerated_image_id: "${file_ids[0]}"`,
|
|
},
|
|
];
|
|
return [response, { content, file_ids }];
|
|
},
|
|
oaiToolkit.image_gen_oai,
|
|
);
|
|
|
|
/**
|
|
* Image Editing Tool
|
|
*/
|
|
const imageEditTool = tool(
|
|
async ({ prompt, image_ids, quality = 'auto', size = 'auto' }, runnableConfig) => {
|
|
if (!prompt) {
|
|
throw new Error('Missing required field: prompt');
|
|
}
|
|
|
|
const clientConfig = { ...closureConfig };
|
|
if (process.env.PROXY) {
|
|
const proxyAgent = new ProxyAgent(process.env.PROXY);
|
|
clientConfig.fetchOptions = {
|
|
dispatcher: proxyAgent,
|
|
};
|
|
}
|
|
|
|
const formData = new FormData();
|
|
formData.append('model', 'gpt-image-1');
|
|
formData.append('prompt', replaceUnwantedChars(prompt));
|
|
// TODO: `mask` support
|
|
// TODO: more than 1 image support
|
|
// formData.append('n', n.toString());
|
|
formData.append('quality', quality);
|
|
formData.append('size', size);
|
|
|
|
/** @type {Record<FileSources, undefined | NodeStreamDownloader<File>>} */
|
|
const streamMethods = {};
|
|
|
|
const requestFilesMap = Object.fromEntries(imageFiles.map((f) => [f.file_id, { ...f }]));
|
|
|
|
const orderedFiles = new Array(image_ids.length);
|
|
const idsToFetch = [];
|
|
const indexOfMissing = Object.create(null);
|
|
|
|
for (let i = 0; i < image_ids.length; i++) {
|
|
const id = image_ids[i];
|
|
const file = requestFilesMap[id];
|
|
|
|
if (file) {
|
|
orderedFiles[i] = file;
|
|
} else {
|
|
idsToFetch.push(id);
|
|
indexOfMissing[id] = i;
|
|
}
|
|
}
|
|
|
|
if (idsToFetch.length) {
|
|
const fetchedFiles = await getFiles(
|
|
{
|
|
user: req.user.id,
|
|
file_id: { $in: idsToFetch },
|
|
height: { $exists: true },
|
|
width: { $exists: true },
|
|
},
|
|
{},
|
|
{},
|
|
);
|
|
|
|
for (const file of fetchedFiles) {
|
|
requestFilesMap[file.file_id] = file;
|
|
orderedFiles[indexOfMissing[file.file_id]] = file;
|
|
}
|
|
}
|
|
for (const imageFile of orderedFiles) {
|
|
if (!imageFile) {
|
|
continue;
|
|
}
|
|
/** @type {NodeStream<File>} */
|
|
let stream;
|
|
/** @type {NodeStreamDownloader<File>} */
|
|
let getDownloadStream;
|
|
const source = imageFile.source || appFileStrategy;
|
|
if (!source) {
|
|
throw new Error('No source found for image file');
|
|
}
|
|
if (streamMethods[source]) {
|
|
getDownloadStream = streamMethods[source];
|
|
} else {
|
|
({ getDownloadStream } = getStrategyFunctions(source));
|
|
streamMethods[source] = getDownloadStream;
|
|
}
|
|
if (!getDownloadStream) {
|
|
throw new Error(`No download stream method found for source: ${source}`);
|
|
}
|
|
stream = await getDownloadStream(req, imageFile.filepath);
|
|
if (!stream) {
|
|
throw new Error('Failed to get download stream for image file');
|
|
}
|
|
formData.append('image[]', stream, {
|
|
filename: imageFile.filename,
|
|
contentType: imageFile.type,
|
|
});
|
|
}
|
|
|
|
/** @type {import('axios').RawAxiosHeaders} */
|
|
let headers = {
|
|
...formData.getHeaders(),
|
|
};
|
|
|
|
if (process.env.IMAGE_GEN_OAI_AZURE_API_VERSION && process.env.IMAGE_GEN_OAI_BASEURL) {
|
|
headers['api-key'] = apiKey;
|
|
} else {
|
|
headers['Authorization'] = `Bearer ${apiKey}`;
|
|
}
|
|
|
|
/** @type {AbortSignal} */
|
|
let derivedSignal = null;
|
|
/** @type {() => void} */
|
|
let abortHandler = null;
|
|
|
|
try {
|
|
if (runnableConfig?.signal) {
|
|
derivedSignal = AbortSignal.any([runnableConfig.signal]);
|
|
abortHandler = createAbortHandler();
|
|
derivedSignal.addEventListener('abort', abortHandler, { once: true });
|
|
}
|
|
|
|
/** @type {import('axios').AxiosRequestConfig} */
|
|
const axiosConfig = {
|
|
headers,
|
|
...clientConfig,
|
|
signal: derivedSignal,
|
|
baseURL,
|
|
};
|
|
|
|
if (process.env.PROXY) {
|
|
axiosConfig.httpsAgent = new HttpsProxyAgent(process.env.PROXY);
|
|
}
|
|
|
|
if (process.env.IMAGE_GEN_OAI_AZURE_API_VERSION && process.env.IMAGE_GEN_OAI_BASEURL) {
|
|
axiosConfig.params = {
|
|
'api-version': process.env.IMAGE_GEN_OAI_AZURE_API_VERSION,
|
|
...axiosConfig.params,
|
|
};
|
|
}
|
|
const response = await axios.post('/images/edits', formData, axiosConfig);
|
|
|
|
if (!response.data || !response.data.data || !response.data.data.length) {
|
|
return returnValue(
|
|
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.',
|
|
);
|
|
}
|
|
|
|
const base64Image = response.data.data[0].b64_json;
|
|
if (!base64Image) {
|
|
return returnValue(
|
|
'No image data returned from OpenAI API. There may be a problem with the API or your configuration.',
|
|
);
|
|
}
|
|
|
|
const content = [
|
|
{
|
|
type: ContentTypes.IMAGE_URL,
|
|
image_url: {
|
|
url: `data:image/${imageOutputType};base64,${base64Image}`,
|
|
},
|
|
},
|
|
];
|
|
|
|
const file_ids = [v4()];
|
|
const textResponse = [
|
|
{
|
|
type: ContentTypes.TEXT,
|
|
text:
|
|
displayMessage +
|
|
`\n\ngenerated_image_id: "${file_ids[0]}"\nreferenced_image_ids: ["${image_ids.join('", "')}"]`,
|
|
},
|
|
];
|
|
return [textResponse, { content, file_ids }];
|
|
} catch (error) {
|
|
const message = '[image_edit_oai] Problem editing the image:';
|
|
logAxiosError({ error, message });
|
|
return returnValue(`Something went wrong when trying to edit the image. The OpenAI API may be unavailable:
|
|
Error Message: ${error.message || 'Unknown error'}`);
|
|
} finally {
|
|
if (abortHandler && derivedSignal) {
|
|
derivedSignal.removeEventListener('abort', abortHandler);
|
|
}
|
|
}
|
|
},
|
|
oaiToolkit.image_edit_oai,
|
|
);
|
|
|
|
return [imageGenTool, imageEditTool];
|
|
}
|
|
|
|
module.exports = createOpenAIImageTools;
|