Mirror of https://github.com/danny-avila/LibreChat.git, synced 2025-09-22 06:00:56 +02:00

* feat: Code Interpreter API & File Search Agent Uploads chore: add back code files wip: first pass, abstract key dialog refactor: influence checkbox on key changes refactor: update localization keys for 'execute code' to 'run code' wip: run code button refactor: add throwError parameter to loadAuthValues and getUserPluginAuthValue functions feat: first pass, API tool calling fix: handle missing toolId in callTool function and return 404 for non-existent tools feat: show code outputs fix: improve error handling in callTool function and log errors fix: handle potential null value for filepath in attachment destructuring fix: normalize language before rendering and prevent null return fix: add loading indicator in RunCode component while executing code feat: add support for conditional code execution in Markdown components feat: attachments refactor: remove bash fix: pass abort signal to graph/run refactor: debounce and rate limit tool call refactor: increase debounce delay for execute function feat: set code output attachments feat: image attachments refactor: apply message context refactor: pass `partIndex` feat: toolCall schema/model/methods feat: block indexing feat: get tool calls chore: imports chore: typing chore: condense type imports feat: get tool calls fix: block indexing chore: typing refactor: update tool calls mapping to support multiple results fix: add unique key to nav link for rendering wip: first pass, tool call results refactor: update query cache from successful tool call mutation style: improve result switcher styling chore: note on using \`.toObject()\` feat: add agent_id field to conversation schema chore: typing refactor: rename agentMap to agentsMap for consistency feat: Agent Name as chat input placeholder chore: bump agents 📦 chore: update @langchain dependencies to latest versions to match agents package 📦 chore: update @librechat/agents dependency to version 1.8.0 fix: Aborting agent stream removes sender; fix(bedrock): completion 
removes preset name label refactor: remove direct file parameter to use req.file, add `processAgentFileUpload` for image uploads feat: upload menu feat: prime message_file resources feat: implement conversation access validation in chat route refactor: remove file parameter from processFileUpload and use req.file instead feat: add savedMessageIds set to track saved message IDs in BaseClient, to prevent unnecessary double-write to db feat: prevent duplicate message saves by checking savedMessageIds in AgentController refactor: skip legacy RAG API handling for agents feat: add files field to convoSchema refactor: update request type annotations from Express.Request to ServerRequest in file processing functions feat: track conversation files fix: resendFiles, addPreviousAttachments handling feat: add ID validation for session_id and file_id in download route feat: entity_id for code file uploads/downloads fix: code file edge cases feat: delete related tool calls feat: add stream rate handling for LLM configuration feat: enhance system content with attached file information fix: improve error logging in resource priming function * WIP: PoC, sequential agents WIP: PoC Sequential Agents, first pass content data + bump agents package fix: package-lock WIP: PoC, o1 support, refactor bufferString feat: convertJsonSchemaToZod fix: form issues and schema defining erroneous model fix: max length issue on agent form instructions, limit conversation messages to sequential agents feat: add abort signal support to createRun function and AgentClient feat: PoC, hide prior sequential agent steps fix: update parameter naming from config to metadata in event handlers for clarity, add model to usage data refactor: use only last contentData, track model for usage data chore: bump agents package fix: content parts issue refactor: filter contentParts to include tool calls and relevant indices feat: show function calls refactor: filter context messages to exclude tool calls when no tools 
are available to the agent fix: ensure tool call content is not undefined in formatMessages feat: add agent_id field to conversationPreset schema feat: hide sequential agents feat: increase upload toast duration to 10 seconds * refactor: tool context handling & update Code API Key Dialog feat: toolContextMap chore: skipSpecs -> useSpecs ci: fix handleTools tests feat: API Key Dialog * feat: Agent Permissions Admin Controls feat: replace label with button for prompt permission toggle feat: update agent permissions feat: enable experimental agents and streamline capability configuration feat: implement access control for agents and enhance endpoint menu items feat: add welcome message for agent selection in localization feat: add agents permission to access control and update version to 0.7.57 * fix: update types in useAssistantListMap and useMentions hooks for better null handling * feat: mention agents * fix: agent tool resource race conditions when deleting agent tool resource files * feat: add error handling for code execution with user feedback * refactor: rename AdminControls to AdminSettings for clarity * style: add gap to button in AdminSettings for improved layout * refactor: separate agent query hooks and check access to enable fetching * fix: remove unused provider from agent initialization options, creates issue with custom endpoints * refactor: remove redundant/deprecated modelOptions from AgentClient processes * chore: update @librechat/agents to version 1.8.5 in package.json and package-lock.json * fix: minor styling issues + agent panel uniformity * fix: agent edge cases when set endpoint is no longer defined * refactor: remove unused cleanup function call from AppService * fix: update link in ApiKeyDialog to point to pricing page * fix: improve type handling and layout calculations in SidePanel component * fix: add missing localization string for agent selection in SidePanel * chore: form styling and localizations for upload filesearch/code 
interpreter * fix: model selection placeholder logic in AgentConfig component * style: agent capabilities * fix: add localization for provider selection and improve dropdown styling in ModelPanel * refactor: use gpt-4o-mini > gpt-3.5-turbo * fix: agents configuration for loadDefaultInterface and update related tests * feat: DALLE Agents support
155 lines
4.2 KiB
JavaScript
const axios = require('axios');
|
|
const {
|
|
FileSources,
|
|
VisionModes,
|
|
ImageDetail,
|
|
ContentTypes,
|
|
EModelEndpoint,
|
|
} = require('librechat-data-provider');
|
|
const { getStrategyFunctions } = require('~/server/services/Files/strategies');
|
|
const { logger } = require('~/config');
|
|
|
|
/**
 * Downloads the image at the given URL and encodes the response body as base64.
 *
 * @async
 * @param {string} url - Location of the image to download.
 * @returns {Promise<string>} The downloaded bytes as a base64-encoded string.
 * @throws {Error} Rethrows any download or encoding failure after logging it.
 */
async function fetchImageToBase64(url) {
  // Request raw bytes so the body can be wrapped in a Buffer without re-decoding.
  const requestOptions = { responseType: 'arraybuffer' };

  try {
    const { data } = await axios.get(url, requestOptions);
    const imageBuffer = Buffer.from(data);
    return imageBuffer.toString('base64');
  } catch (err) {
    logger.error('Error fetching image to convert to base64', err);
    throw err;
  }
}
|
|
|
|
/**
 * Endpoints for which `encodeAndFormat` downloads non-local images and sends
 * them as base64 data instead of passing the image URL through.
 * @type {Set<string>}
 */
const base64Only = new Set()
  .add(EModelEndpoint.google)
  .add(EModelEndpoint.anthropic)
  .add('Ollama')
  .add('ollama')
  .add(EModelEndpoint.bedrock);
|
|
|
|
/**
 * Builds the endpoint-specific content part for one encoded image.
 *
 * @param {Object} params
 * @param {MongoFile} params.file - The file record; `file.type` is used as the MIME type.
 * @param {string} params.imageContent - Image content: a string starting with `http` is used
 *   as-is as the URL, anything else is treated as base64 data.
 * @param {string} params.detail - Value placed in `image_url.detail` for the default shape.
 * @param {EModelEndpoint} [params.endpoint] - Target endpoint.
 * @param {string} [params.mode] - Vision mode.
 * @returns {Object} The image content part.
 */
function formatImagePart({ file, imageContent, detail, endpoint, mode }) {
  const url = imageContent.startsWith('http')
    ? imageContent
    : `data:${file.type};base64,${imageContent}`;

  // Agents mode always takes the default `image_url` shape, whatever the endpoint.
  if (mode !== VisionModes.agents) {
    if (endpoint === EModelEndpoint.google && mode === VisionModes.generative) {
      return {
        type: ContentTypes.IMAGE_URL,
        inlineData: {
          mimeType: file.type,
          data: imageContent,
        },
      };
    }

    if (endpoint === EModelEndpoint.google) {
      // Here `image_url` is the plain URL string rather than a `{ url, detail }` object.
      return {
        type: ContentTypes.IMAGE_URL,
        image_url: url,
      };
    }

    if (endpoint === EModelEndpoint.anthropic) {
      return {
        type: 'image',
        source: {
          type: 'base64',
          media_type: file.type,
          data: imageContent,
        },
      };
    }
  }

  return {
    type: ContentTypes.IMAGE_URL,
    image_url: {
      url,
      detail,
    },
  };
}

/**
 * Encodes and formats the given files.
 *
 * Files without a `height` are treated as non-images: only their metadata is returned.
 * For images, the payload is prepared by the storage strategy of the file's `source`
 * (defaulting to `FileSources.local`). When the endpoint is in `base64Only` and the file
 * is not local, the prepared URL is downloaded and converted to base64.
 *
 * All files are processed concurrently; the order of `files` is preserved in the result.
 *
 * @param {Express.Request} req - The request object; `req.body.imageDetail` (if present)
 *   sets the image detail, otherwise `ImageDetail.auto` is used.
 * @param {Array<MongoFile>} files - The array of files to encode and format.
 * @param {EModelEndpoint} [endpoint] - Optional: The endpoint for the image.
 * @param {string} [mode] - Optional: The endpoint mode for the image.
 * @returns {Promise<Object>} - A promise that resolves to `{ files, image_urls }`: the
 *   metadata of every file and the formatted image parts.
 * @throws {Error} If the storage strategy of an image's source has no `prepareImagePayload`,
 *   or if preparing/fetching an image fails.
 */
async function encodeAndFormat(req, files, endpoint, mode) {
  const result = {
    files: [],
    image_urls: [],
  };

  if (!files || !files.length) {
    return result;
  }

  /** Cache of `prepareImagePayload` functions keyed by file source. */
  const encodingMethods = {};
  const requiresBase64 = base64Only.has(endpoint);

  // Every file is handled inside its own promise so that independent files are
  // processed in parallel and any failure (including a missing strategy) is
  // observed by `Promise.all` instead of leaving pending promises unhandled.
  /** @type {Array<[MongoFile, string | null]>} */
  const formattedImages = await Promise.all(
    Array.from(files, async (file) => {
      if (!file.height) {
        return [file, null];
      }

      const source = file.source ?? FileSources.local;

      if (!encodingMethods[source]) {
        const { prepareImagePayload } = getStrategyFunctions(source);
        if (!prepareImagePayload) {
          throw new Error(`Encoding function not implemented for ${source}`);
        }

        encodingMethods[source] = prepareImagePayload;
      }

      const preparePayload = encodingMethods[source];

      /* Google & Anthropic don't support passing URLs to payload */
      if (source !== FileSources.local && requiresBase64) {
        const [_file, imageURL] = await preparePayload(req, file);
        return [_file, await fetchImageToBase64(imageURL)];
      }

      return preparePayload(req, file);
    }),
  );

  const detail = req.body?.imageDetail ?? ImageDetail.auto;

  for (const [file, imageContent] of formattedImages) {
    const fileMetadata = {
      type: file.type,
      file_id: file.file_id,
      filepath: file.filepath,
      filename: file.filename,
      embedded: !!file.embedded,
      metadata: file.metadata,
    };

    if (file.height && file.width) {
      fileMetadata.height = file.height;
      fileMetadata.width = file.width;
    }

    if (imageContent) {
      result.image_urls.push(formatImagePart({ file, imageContent, detail, endpoint, mode }));
    }

    result.files.push(fileMetadata);
  }

  return result;
}
|
|
|
|
/* Public API of this module. */
module.exports = { encodeAndFormat };
|