mirror of
https://github.com/danny-avila/LibreChat.git
synced 2025-09-22 08:12:00 +02:00

* refactor: move `loadAuthValues` to `~/services/Tools/credentials` * feat: add createAxiosInstance function to configure axios with proxy support * WIP: First pass mistral ocr * refactor: replace getConvoFiles with getToolFiles for improved file retrieval logic * refactor: improve document formatting in encodeAndFormat function * refactor: remove unused resendFiles parameter from buildOptions function (this option comes from the agent config) * fix: update getFiles call to include files with `text` property as well * refactor: move file handling to `initializeAgentOptions` * refactor: enhance addImageURLs method to handle OCR text and improve message formatting * refactor: update message formatting to handle OCR text in various content types * refactor: remove unused resendFiles property from compactAgentsSchema * fix: add error handling for Mistral OCR document upload and logging * refactor: integrate OCR capability into file upload options and configuration * refactor: skip processing for text source files in delete request, as they are directly tied to database * feat: add metadata field to ExtendedFile type and update PanelColumns and PanelTable components for localization and metadata handling * fix: source icon styling * wip: first pass, frontend file context agent resources * refactor: add hover card with contextual information for File Context (OCR) in FileContext component * feat: enhance file processing by integrating file retrieval for OCR resources in agent initialization * feat: implement OCR config; fix: agent resource deletion for ocr files * feat: enhance agent initialization by adding OCR capability check in resource priming * ci: fix `~/config` module mock * ci: add OCR property expectation in AppService tests * refactor: simplify OCR config loading by removing environment variable extraction, to be done when OCR is actually performed * ci: add unit test to ensure environment variable references are not parsed in OCR config * refactor: disable base64 image inclusion in OCR request * refactor: enhance OCR configuration handling by validating environment variables and providing defaults * refactor: use file stream from disk for mistral ocr api
289 lines
9.8 KiB
JavaScript
289 lines
9.8 KiB
JavaScript
const Conversation = require('./schema/convoSchema');
|
|
const { getMessages, deleteMessages } = require('./Message');
|
|
const logger = require('~/config/winston');
|
|
|
|
/**
|
|
* Searches for a conversation by conversationId and returns a lean document with only conversationId and user.
|
|
* @param {string} conversationId - The conversation's ID.
|
|
* @returns {Promise<{conversationId: string, user: string} | null>} The conversation object with selected fields or null if not found.
|
|
*/
|
|
const searchConversation = async (conversationId) => {
|
|
try {
|
|
return await Conversation.findOne({ conversationId }, 'conversationId user').lean();
|
|
} catch (error) {
|
|
logger.error('[searchConversation] Error searching conversation', error);
|
|
throw new Error('Error searching conversation');
|
|
}
|
|
};
|
|
|
|
/**
|
|
* Retrieves a single conversation for a given user and conversation ID.
|
|
* @param {string} user - The user's ID.
|
|
* @param {string} conversationId - The conversation's ID.
|
|
* @returns {Promise<TConversation>} The conversation object.
|
|
*/
|
|
const getConvo = async (user, conversationId) => {
|
|
try {
|
|
return await Conversation.findOne({ user, conversationId }).lean();
|
|
} catch (error) {
|
|
logger.error('[getConvo] Error getting single conversation', error);
|
|
return { message: 'Error getting single conversation' };
|
|
}
|
|
};
|
|
|
|
const deleteNullOrEmptyConversations = async () => {
|
|
try {
|
|
const filter = {
|
|
$or: [
|
|
{ conversationId: null },
|
|
{ conversationId: '' },
|
|
{ conversationId: { $exists: false } },
|
|
],
|
|
};
|
|
|
|
const result = await Conversation.deleteMany(filter);
|
|
|
|
// Delete associated messages
|
|
const messageDeleteResult = await deleteMessages(filter);
|
|
|
|
logger.info(
|
|
`[deleteNullOrEmptyConversations] Deleted ${result.deletedCount} conversations and ${messageDeleteResult.deletedCount} messages`,
|
|
);
|
|
|
|
return {
|
|
conversations: result,
|
|
messages: messageDeleteResult,
|
|
};
|
|
} catch (error) {
|
|
logger.error('[deleteNullOrEmptyConversations] Error deleting conversations', error);
|
|
throw new Error('Error deleting conversations with null or empty conversationId');
|
|
}
|
|
};
|
|
|
|
/**
|
|
* Retrieves files from a conversation that have either embedded=true
|
|
* or a metadata.fileIdentifier. Simplified and efficient query.
|
|
*
|
|
* @param {string} conversationId - The conversation ID
|
|
* @returns {Promise<MongoFile[]>} - Filtered array of matching file objects
|
|
*/
|
|
const getToolFiles = async (conversationId) => {
|
|
try {
|
|
const [result] = await Conversation.aggregate([
|
|
{ $match: { conversationId } },
|
|
{
|
|
$project: {
|
|
files: {
|
|
$filter: {
|
|
input: '$files',
|
|
as: 'file',
|
|
cond: {
|
|
$or: [
|
|
{ $eq: ['$$file.embedded', true] },
|
|
{ $ifNull: ['$$file.metadata.fileIdentifier', false] },
|
|
],
|
|
},
|
|
},
|
|
},
|
|
_id: 0,
|
|
},
|
|
},
|
|
]).exec();
|
|
|
|
return result?.files || [];
|
|
} catch (error) {
|
|
logger.error('[getConvoEmbeddedFiles] Error fetching embedded files:', error);
|
|
throw new Error('Error fetching embedded files');
|
|
}
|
|
};
|
|
|
|
module.exports = {
|
|
Conversation,
|
|
getToolFiles,
|
|
searchConversation,
|
|
deleteNullOrEmptyConversations,
|
|
/**
|
|
* Saves a conversation to the database.
|
|
* @param {Object} req - The request object.
|
|
* @param {string} conversationId - The conversation's ID.
|
|
* @param {Object} metadata - Additional metadata to log for operation.
|
|
* @returns {Promise<TConversation>} The conversation object.
|
|
*/
|
|
saveConvo: async (req, { conversationId, newConversationId, ...convo }, metadata) => {
|
|
try {
|
|
if (metadata && metadata?.context) {
|
|
logger.debug(`[saveConvo] ${metadata.context}`);
|
|
}
|
|
const messages = await getMessages({ conversationId }, '_id');
|
|
const update = { ...convo, messages, user: req.user.id };
|
|
if (newConversationId) {
|
|
update.conversationId = newConversationId;
|
|
}
|
|
|
|
if (req.body.isTemporary) {
|
|
const expiredAt = new Date();
|
|
expiredAt.setDate(expiredAt.getDate() + 30);
|
|
update.expiredAt = expiredAt;
|
|
} else {
|
|
update.expiredAt = null;
|
|
}
|
|
|
|
/** @type {{ $set: Partial<TConversation>; $unset?: Record<keyof TConversation, number> }} */
|
|
const updateOperation = { $set: update };
|
|
if (metadata && metadata.unsetFields && Object.keys(metadata.unsetFields).length > 0) {
|
|
updateOperation.$unset = metadata.unsetFields;
|
|
}
|
|
|
|
/** Note: the resulting Model object is necessary for Meilisearch operations */
|
|
const conversation = await Conversation.findOneAndUpdate(
|
|
{ conversationId, user: req.user.id },
|
|
updateOperation,
|
|
{
|
|
new: true,
|
|
upsert: true,
|
|
},
|
|
);
|
|
|
|
return conversation.toObject();
|
|
} catch (error) {
|
|
logger.error('[saveConvo] Error saving conversation', error);
|
|
if (metadata && metadata?.context) {
|
|
logger.info(`[saveConvo] ${metadata.context}`);
|
|
}
|
|
return { message: 'Error saving conversation' };
|
|
}
|
|
},
|
|
bulkSaveConvos: async (conversations) => {
|
|
try {
|
|
const bulkOps = conversations.map((convo) => ({
|
|
updateOne: {
|
|
filter: { conversationId: convo.conversationId, user: convo.user },
|
|
update: convo,
|
|
upsert: true,
|
|
timestamps: false,
|
|
},
|
|
}));
|
|
|
|
const result = await Conversation.bulkWrite(bulkOps);
|
|
return result;
|
|
} catch (error) {
|
|
logger.error('[saveBulkConversations] Error saving conversations in bulk', error);
|
|
throw new Error('Failed to save conversations in bulk.');
|
|
}
|
|
},
|
|
getConvosByPage: async (user, pageNumber = 1, pageSize = 25, isArchived = false, tags) => {
|
|
const query = { user };
|
|
if (isArchived) {
|
|
query.isArchived = true;
|
|
} else {
|
|
query.$or = [{ isArchived: false }, { isArchived: { $exists: false } }];
|
|
}
|
|
if (Array.isArray(tags) && tags.length > 0) {
|
|
query.tags = { $in: tags };
|
|
}
|
|
|
|
query.$and = [{ $or: [{ expiredAt: null }, { expiredAt: { $exists: false } }] }];
|
|
|
|
try {
|
|
const totalConvos = (await Conversation.countDocuments(query)) || 1;
|
|
const totalPages = Math.ceil(totalConvos / pageSize);
|
|
const convos = await Conversation.find(query)
|
|
.sort({ updatedAt: -1 })
|
|
.skip((pageNumber - 1) * pageSize)
|
|
.limit(pageSize)
|
|
.lean();
|
|
return { conversations: convos, pages: totalPages, pageNumber, pageSize };
|
|
} catch (error) {
|
|
logger.error('[getConvosByPage] Error getting conversations', error);
|
|
return { message: 'Error getting conversations' };
|
|
}
|
|
},
|
|
getConvosQueried: async (user, convoIds, pageNumber = 1, pageSize = 25) => {
|
|
try {
|
|
if (!convoIds || convoIds.length === 0) {
|
|
return { conversations: [], pages: 1, pageNumber, pageSize };
|
|
}
|
|
|
|
const cache = {};
|
|
const convoMap = {};
|
|
const promises = [];
|
|
|
|
convoIds.forEach((convo) =>
|
|
promises.push(
|
|
Conversation.findOne({
|
|
user,
|
|
conversationId: convo.conversationId,
|
|
$or: [{ expiredAt: { $exists: false } }, { expiredAt: null }],
|
|
}).lean(),
|
|
),
|
|
);
|
|
|
|
const results = (await Promise.all(promises)).filter(Boolean);
|
|
|
|
results.forEach((convo, i) => {
|
|
const page = Math.floor(i / pageSize) + 1;
|
|
if (!cache[page]) {
|
|
cache[page] = [];
|
|
}
|
|
cache[page].push(convo);
|
|
convoMap[convo.conversationId] = convo;
|
|
});
|
|
|
|
const totalPages = Math.ceil(results.length / pageSize);
|
|
cache.pages = totalPages;
|
|
cache.pageSize = pageSize;
|
|
return {
|
|
cache,
|
|
conversations: cache[pageNumber] || [],
|
|
pages: totalPages || 1,
|
|
pageNumber,
|
|
pageSize,
|
|
convoMap,
|
|
};
|
|
} catch (error) {
|
|
logger.error('[getConvosQueried] Error getting conversations', error);
|
|
return { message: 'Error fetching conversations' };
|
|
}
|
|
},
|
|
getConvo,
|
|
/* chore: this method is not properly error handled */
|
|
getConvoTitle: async (user, conversationId) => {
|
|
try {
|
|
const convo = await getConvo(user, conversationId);
|
|
/* ChatGPT Browser was triggering error here due to convo being saved later */
|
|
if (convo && !convo.title) {
|
|
return null;
|
|
} else {
|
|
// TypeError: Cannot read properties of null (reading 'title')
|
|
return convo?.title || 'New Chat';
|
|
}
|
|
} catch (error) {
|
|
logger.error('[getConvoTitle] Error getting conversation title', error);
|
|
return { message: 'Error getting conversation title' };
|
|
}
|
|
},
|
|
/**
|
|
* Asynchronously deletes conversations and associated messages for a given user and filter.
|
|
*
|
|
* @async
|
|
* @function
|
|
* @param {string|ObjectId} user - The user's ID.
|
|
* @param {Object} filter - Additional filter criteria for the conversations to be deleted.
|
|
* @returns {Promise<{ n: number, ok: number, deletedCount: number, messages: { n: number, ok: number, deletedCount: number } }>}
|
|
* An object containing the count of deleted conversations and associated messages.
|
|
* @throws {Error} Throws an error if there's an issue with the database operations.
|
|
*
|
|
* @example
|
|
* const user = 'someUserId';
|
|
* const filter = { someField: 'someValue' };
|
|
* const result = await deleteConvos(user, filter);
|
|
* logger.error(result); // { n: 5, ok: 1, deletedCount: 5, messages: { n: 10, ok: 1, deletedCount: 10 } }
|
|
*/
|
|
deleteConvos: async (user, filter) => {
|
|
let toRemove = await Conversation.find({ ...filter, user }).select('conversationId');
|
|
const ids = toRemove.map((instance) => instance.conversationId);
|
|
let deleteCount = await Conversation.deleteMany({ ...filter, user });
|
|
deleteCount.messages = await deleteMessages({ conversationId: { $in: ids } });
|
|
return deleteCount;
|
|
},
|
|
};
|