mirror of
https://github.com/danny-avila/LibreChat.git
synced 2025-12-17 17:00:15 +01:00
♻️ fix: Prevent Instructions from Removal when nearing Max Context (#5516)
* refactor: getMessagesWithinTokenLimit to accept params object
* refactor: always include instructions in payload if provided
* ci: remove obsolete test
* refactor: update logoutUser to accept request object and handle session destruction
* test: enhance getMessagesWithinTokenLimit tests for instruction handling
This commit is contained in:
parent
528ee62eb1
commit
4110209494
6 changed files with 185 additions and 83 deletions
|
|
@ -159,7 +159,7 @@ describe('BaseClient', () => {
|
|||
expectedMessagesToRefine?.[expectedMessagesToRefine.length - 1] ?? {};
|
||||
const expectedIndex = messages.findIndex((msg) => msg.content === lastExpectedMessage?.content);
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit(messages);
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({ messages });
|
||||
|
||||
expect(result.context).toEqual(expectedContext);
|
||||
expect(result.summaryIndex).toEqual(expectedIndex);
|
||||
|
|
@ -195,7 +195,7 @@ describe('BaseClient', () => {
|
|||
expectedMessagesToRefine?.[expectedMessagesToRefine.length - 1] ?? {};
|
||||
const expectedIndex = messages.findIndex((msg) => msg.content === lastExpectedMessage?.content);
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit(messages);
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({ messages });
|
||||
|
||||
expect(result.context).toEqual(expectedContext);
|
||||
expect(result.summaryIndex).toEqual(expectedIndex);
|
||||
|
|
@ -203,66 +203,6 @@ describe('BaseClient', () => {
|
|||
expect(result.messagesToRefine).toEqual(expectedMessagesToRefine);
|
||||
});
|
||||
|
||||
test('handles context strategy correctly in handleContextStrategy()', async () => {
|
||||
TestClient.addInstructions = jest
|
||||
.fn()
|
||||
.mockReturnValue([
|
||||
{ content: 'Hello' },
|
||||
{ content: 'How can I help you?' },
|
||||
{ content: 'Please provide more details.' },
|
||||
{ content: 'I can assist you with that.' },
|
||||
]);
|
||||
TestClient.getMessagesWithinTokenLimit = jest.fn().mockReturnValue({
|
||||
context: [
|
||||
{ content: 'How can I help you?' },
|
||||
{ content: 'Please provide more details.' },
|
||||
{ content: 'I can assist you with that.' },
|
||||
],
|
||||
remainingContextTokens: 80,
|
||||
messagesToRefine: [{ content: 'Hello' }],
|
||||
summaryIndex: 3,
|
||||
});
|
||||
|
||||
TestClient.getTokenCount = jest.fn().mockReturnValue(40);
|
||||
|
||||
const instructions = { content: 'Please provide more details.' };
|
||||
const orderedMessages = [
|
||||
{ content: 'Hello' },
|
||||
{ content: 'How can I help you?' },
|
||||
{ content: 'Please provide more details.' },
|
||||
{ content: 'I can assist you with that.' },
|
||||
];
|
||||
const formattedMessages = [
|
||||
{ content: 'Hello' },
|
||||
{ content: 'How can I help you?' },
|
||||
{ content: 'Please provide more details.' },
|
||||
{ content: 'I can assist you with that.' },
|
||||
];
|
||||
const expectedResult = {
|
||||
payload: [
|
||||
{
|
||||
role: 'system',
|
||||
content: 'Refined answer',
|
||||
},
|
||||
{ content: 'How can I help you?' },
|
||||
{ content: 'Please provide more details.' },
|
||||
{ content: 'I can assist you with that.' },
|
||||
],
|
||||
promptTokens: expect.any(Number),
|
||||
tokenCountMap: {},
|
||||
messages: expect.any(Array),
|
||||
};
|
||||
|
||||
TestClient.shouldSummarize = true;
|
||||
const result = await TestClient.handleContextStrategy({
|
||||
instructions,
|
||||
orderedMessages,
|
||||
formattedMessages,
|
||||
});
|
||||
|
||||
expect(result).toEqual(expectedResult);
|
||||
});
|
||||
|
||||
describe('getMessagesForConversation', () => {
|
||||
it('should return an empty array if the parentMessageId does not exist', () => {
|
||||
const result = TestClient.constructor.getMessagesForConversation({
|
||||
|
|
@ -674,4 +614,112 @@ describe('BaseClient', () => {
|
|||
expect(calls[1][0].isCreatedByUser).toBe(false); // Second call should be for response message
|
||||
});
|
||||
});
|
||||
|
||||
describe('getMessagesWithinTokenLimit with instructions', () => {
|
||||
test('should always include instructions when present', async () => {
|
||||
TestClient.maxContextTokens = 50;
|
||||
const instructions = {
|
||||
role: 'system',
|
||||
content: 'System instructions',
|
||||
tokenCount: 20,
|
||||
};
|
||||
|
||||
const messages = [
|
||||
instructions,
|
||||
{ role: 'user', content: 'Hello', tokenCount: 10 },
|
||||
{ role: 'assistant', content: 'Hi there', tokenCount: 15 },
|
||||
];
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({
|
||||
messages,
|
||||
instructions,
|
||||
});
|
||||
|
||||
expect(result.context[0]).toBe(instructions);
|
||||
expect(result.remainingContextTokens).toBe(2);
|
||||
});
|
||||
|
||||
test('should handle case when messages exceed limit but instructions must be preserved', async () => {
|
||||
TestClient.maxContextTokens = 30;
|
||||
const instructions = {
|
||||
role: 'system',
|
||||
content: 'System instructions',
|
||||
tokenCount: 20,
|
||||
};
|
||||
|
||||
const messages = [
|
||||
instructions,
|
||||
{ role: 'user', content: 'Hello', tokenCount: 10 },
|
||||
{ role: 'assistant', content: 'Hi there', tokenCount: 15 },
|
||||
];
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({
|
||||
messages,
|
||||
instructions,
|
||||
});
|
||||
|
||||
// Only the instructions fit within the limit; both conversation messages are left to be refined
|
||||
expect(result.context).toHaveLength(1);
|
||||
expect(result.context[0].content).toBe(instructions.content);
|
||||
expect(result.messagesToRefine).toHaveLength(2);
|
||||
expect(result.remainingContextTokens).toBe(7); // 30 - 20 - 3 (assistant label)
|
||||
});
|
||||
|
||||
test('should work correctly without instructions (1/2)', async () => {
|
||||
TestClient.maxContextTokens = 50;
|
||||
const messages = [
|
||||
{ role: 'user', content: 'Hello', tokenCount: 10 },
|
||||
{ role: 'assistant', content: 'Hi there', tokenCount: 15 },
|
||||
];
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({
|
||||
messages,
|
||||
});
|
||||
|
||||
expect(result.context).toHaveLength(2);
|
||||
expect(result.remainingContextTokens).toBe(22); // 50 - 10 - 15 - 3(assistant label)
|
||||
expect(result.messagesToRefine).toHaveLength(0);
|
||||
});
|
||||
|
||||
test('should work correctly without instructions (2/2)', async () => {
|
||||
TestClient.maxContextTokens = 30;
|
||||
const messages = [
|
||||
{ role: 'user', content: 'Hello', tokenCount: 10 },
|
||||
{ role: 'assistant', content: 'Hi there', tokenCount: 20 },
|
||||
];
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({
|
||||
messages,
|
||||
});
|
||||
|
||||
expect(result.context).toHaveLength(1);
|
||||
expect(result.remainingContextTokens).toBe(7);
|
||||
expect(result.messagesToRefine).toHaveLength(1);
|
||||
});
|
||||
|
||||
test('should handle case when only instructions fit within limit', async () => {
|
||||
TestClient.maxContextTokens = 25;
|
||||
const instructions = {
|
||||
role: 'system',
|
||||
content: 'System instructions',
|
||||
tokenCount: 20,
|
||||
};
|
||||
|
||||
const messages = [
|
||||
instructions,
|
||||
{ role: 'user', content: 'Hello', tokenCount: 10 },
|
||||
{ role: 'assistant', content: 'Hi there', tokenCount: 15 },
|
||||
];
|
||||
|
||||
const result = await TestClient.getMessagesWithinTokenLimit({
|
||||
messages,
|
||||
instructions,
|
||||
});
|
||||
|
||||
expect(result.context).toHaveLength(1);
|
||||
expect(result.context[0]).toBe(instructions);
|
||||
expect(result.messagesToRefine).toHaveLength(2);
|
||||
expect(result.remainingContextTokens).toBe(2); // 25 - 20 - 3(assistant label)
|
||||
});
|
||||
});
|
||||
});
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue