LibreChat/api/app/clients/prompts/truncate.js

const MAX_CHAR = 255;

/**
 * Truncates a given text to a specified maximum length, appending ellipsis and a notification
 * if the original text exceeds the maximum length.
 *
 * @param {string} text - The text to be truncated.
 * @param {number} [maxLength=MAX_CHAR] - The maximum length of the text after truncation. Defaults to MAX_CHAR.
 * @returns {string} The truncated text if the original text length exceeds maxLength, otherwise returns the original text.
 */
function truncateText(text, maxLength = MAX_CHAR) {
  if (text.length > maxLength) {
    return `${text.slice(0, maxLength)}... [text truncated for brevity]`;
  }
  return text;
}

/**
 * Truncates a given text to a specified maximum length by showing the first half and the last half of the text,
 * separated by ellipsis. This method ensures the output does not exceed the maximum length, including the addition
 * of ellipsis and notification if the original text exceeds the maximum length.
 *
 * @param {string} text - The text to be truncated.
 * @param {number} [maxLength=MAX_CHAR] - The maximum length of the output text after truncation. Defaults to MAX_CHAR.
 * @returns {string} The truncated text showing the first half and the last half, or the original text if it does not exceed maxLength.
 */
function smartTruncateText(text, maxLength = MAX_CHAR) {
  const ellipsis = '...';
  const notification = ' [text truncated for brevity]';
  const halfMaxLength = Math.floor((maxLength - ellipsis.length - notification.length) / 2);

  if (text.length > maxLength) {
    const startLastHalf = text.length - halfMaxLength;
    return `${text.slice(0, halfMaxLength)}${ellipsis}${text.slice(startLastHalf)}${notification}`;
  }

  return text;
}

/**
 * @param {TMessage[]} _messages
 * @param {number} maxContextTokens
 * @param {function({role: string, content: TMessageContent[]}): number} getTokenCountForMessage
 *
 * @returns {{
 *  dbMessages: TMessage[],
 * editedIndices: number[]
 * }}
 */
function truncateToolCallOutputs(_messages, maxContextTokens, getTokenCountForMessage) {
  const THRESHOLD_PERCENTAGE = 0.5;
  const targetTokenLimit = maxContextTokens * THRESHOLD_PERCENTAGE;

  let currentTokenCount = 3;
  const messages = [..._messages];
  const processedMessages = [];
  let currentIndex = messages.length;
  const editedIndices = new Set();
  while (messages.length > 0) {
    currentIndex--;
    const message = messages.pop();
    currentTokenCount += message.tokenCount;
    if (currentTokenCount < targetTokenLimit) {
      processedMessages.push(message);
      continue;
    }

    if (!message.content || !Array.isArray(message.content)) {
      processedMessages.push(message);
      continue;
    }

    const toolCallIndices = message.content
      .map((item, index) => (item.type === 'tool_call' ? index : -1))
      .filter((index) => index !== -1)
      .reverse();

    if (toolCallIndices.length === 0) {
      processedMessages.push(message);
      continue;
    }

    const newContent = [...message.content];

    // Truncate all tool outputs since we're over threshold
    for (const index of toolCallIndices) {
      const toolCall = newContent[index].tool_call;
      if (!toolCall || !toolCall.output) {
        continue;
      }

      editedIndices.add(currentIndex);

      newContent[index] = {
        ...newContent[index],
        tool_call: {
          ...toolCall,
          output: '[OUTPUT_OMITTED_FOR_BREVITY]',
        },
      };
    }

    const truncatedMessage = {
      ...message,
      content: newContent,
      tokenCount: getTokenCountForMessage({ role: 'assistant', content: newContent }),
    };

    processedMessages.push(truncatedMessage);
  }

  return { dbMessages: processedMessages.reverse(), editedIndices: Array.from(editedIndices) };
}

module.exports = { truncateText, smartTruncateText, truncateToolCallOutputs };
🔧 refactor: Improve Agent Context & Minor Fixes (#5349) * refactor: Improve Context for Agents * 🔧 fix: Safeguard against undefined properties in OpenAIClient response handling * refactor: log error before re-throwing for original stack trace * refactor: remove toolResource state from useFileHandling, allow svg files * refactor: prevent verbose logs from axios errors when using actions * refactor: add silent method recordTokenUsage in AgentClient * refactor: streamline token count assignment in BaseClient * refactor: enhance safety settings handling for Gemini 2.0 model * fix: capabilities structure in MCPConnection * refactor: simplify civic integrity threshold handling in GoogleClient and llm * refactor: update token count retrieval method in BaseClient tests * ci: fix test for svg 2025-01-17 12:55:48 -05:00			`const MAX_CHAR = 255;`

			`/**`
			`* Truncates a given text to a specified maximum length, appending ellipsis and a notification`
			`* if the original text exceeds the maximum length.`
			`*`
			`* @param {string} text - The text to be truncated.`
			`* @param {number} [maxLength=MAX_CHAR] - The maximum length of the text after truncation. Defaults to MAX_CHAR.`
			`* @returns {string} The truncated text if the original text length exceeds maxLength, otherwise returns the original text.`
			`*/`
			`function truncateText(text, maxLength = MAX_CHAR) {`
			`if (text.length > maxLength) {`
			return `${text.slice(0, maxLength)}... [text truncated for brevity]`;
			`}`
			`return text;`
			`}`

			`/**`
			`* Truncates a given text to a specified maximum length by showing the first half and the last half of the text,`
			`* separated by ellipsis. This method ensures the output does not exceed the maximum length, including the addition`
			`* of ellipsis and notification if the original text exceeds the maximum length.`
			`*`
			`* @param {string} text - The text to be truncated.`
			`* @param {number} [maxLength=MAX_CHAR] - The maximum length of the output text after truncation. Defaults to MAX_CHAR.`
			`* @returns {string} The truncated text showing the first half and the last half, or the original text if it does not exceed maxLength.`
			`*/`
			`function smartTruncateText(text, maxLength = MAX_CHAR) {`
			`const ellipsis = '...';`
			`const notification = ' [text truncated for brevity]';`
			`const halfMaxLength = Math.floor((maxLength - ellipsis.length - notification.length) / 2);`

			`if (text.length > maxLength) {`
			`const startLastHalf = text.length - halfMaxLength;`
			return `${text.slice(0, halfMaxLength)}${ellipsis}${text.slice(startLastHalf)}${notification}`;
			`}`

			`return text;`
			`}`

			`/**`
			`* @param {TMessage[]} _messages`
			`* @param {number} maxContextTokens`
			`* @param {function({role: string, content: TMessageContent[]}): number} getTokenCountForMessage`
			`*`
			`* @returns {{`
			`* dbMessages: TMessage[],`
			`* editedIndices: number[]`
			`* }}`
			`*/`
			`function truncateToolCallOutputs(_messages, maxContextTokens, getTokenCountForMessage) {`
			`const THRESHOLD_PERCENTAGE = 0.5;`
			`const targetTokenLimit = maxContextTokens * THRESHOLD_PERCENTAGE;`

			`let currentTokenCount = 3;`
			`const messages = [..._messages];`
			`const processedMessages = [];`
			`let currentIndex = messages.length;`
			`const editedIndices = new Set();`
			`while (messages.length > 0) {`
			`currentIndex--;`
			`const message = messages.pop();`
			`currentTokenCount += message.tokenCount;`
			`if (currentTokenCount < targetTokenLimit) {`
			`processedMessages.push(message);`
			`continue;`
			`}`

			`if (!message.content \|\| !Array.isArray(message.content)) {`
			`processedMessages.push(message);`
			`continue;`
			`}`

			`const toolCallIndices = message.content`
			`.map((item, index) => (item.type === 'tool_call' ? index : -1))`
			`.filter((index) => index !== -1)`
			`.reverse();`

			`if (toolCallIndices.length === 0) {`
			`processedMessages.push(message);`
			`continue;`
			`}`

			`const newContent = [...message.content];`

			`// Truncate all tool outputs since we're over threshold`
			`for (const index of toolCallIndices) {`
			`const toolCall = newContent[index].tool_call;`
			`if (!toolCall \|\| !toolCall.output) {`
			`continue;`
			`}`

			`editedIndices.add(currentIndex);`

			`newContent[index] = {`
			`...newContent[index],`
			`tool_call: {`
			`...toolCall,`
			`output: '[OUTPUT_OMITTED_FOR_BREVITY]',`
			`},`
			`};`
			`}`

			`const truncatedMessage = {`
			`...message,`
			`content: newContent,`
			`tokenCount: getTokenCountForMessage({ role: 'assistant', content: newContent }),`
			`};`

			`processedMessages.push(truncatedMessage);`
			`}`

			`return { dbMessages: processedMessages.reverse(), editedIndices: Array.from(editedIndices) };`
			`}`

			`module.exports = { truncateText, smartTruncateText, truncateToolCallOutputs };`