🤖 feat: GPT-5.4 and GPT-5.4-pro Context + Pricing (#12099)

* ✨ feat: Add support for new GPT-5.4 and GPT-5.4-pro models
  - Introduced new token values and cache settings for 'gpt-5.4' and 'gpt-5.4-pro' in the API model configurations.
  - Updated maximum output limits for the new models in the tokens utility.
  - Included 'gpt-5.4' and 'gpt-5.4-pro' in the shared OpenAI models list for consistent access across the application.

* 🔧 update: Enhance GPT-5.4 and GPT-5.4-pro model configurations
  - Refined token pricing and cache settings for 'gpt-5.4' and 'gpt-5.4-pro' in the API model configurations.
  - Added tests for cache multipliers and maximum token limits for the new models.
  - Updated shared OpenAI models list to include 'gpt-5.4-thinking' and added a note for verifying pricing before release.

* 🔧 update: Add clarification to token pricing for 'gpt-5.4-pro'
  - Added a comment to the 'gpt-5.4-pro' model configuration in tokens.ts to specify that it shares the same token window as 'gpt-5.4', enhancing clarity for future reference.
2026-03-07 16:42:38 +01:00 · 2026-03-06 02:11:01 -05:00 · 2026-03-06 02:11:01 -05:00 · a79f7cebd5
commit a79f7cebd5
parent 3b84cc048a
5 changed files with 100 additions and 24 deletions
--- a/api/utils/tokens.spec.js
+++ b/api/utils/tokens.spec.js
@@ -214,6 +214,25 @@ describe('getModelMaxTokens', () => {
    );
  });

+  test('should return correct tokens for gpt-5.4 matches', () => {
+    expect(getModelMaxTokens('gpt-5.4')).toBe(maxTokensMap[EModelEndpoint.openAI]['gpt-5.4']);
+    expect(getModelMaxTokens('gpt-5.4-thinking')).toBe(
+      maxTokensMap[EModelEndpoint.openAI]['gpt-5.4'],
+    );
+    expect(getModelMaxTokens('openai/gpt-5.4')).toBe(
+      maxTokensMap[EModelEndpoint.openAI]['gpt-5.4'],
+    );
+  });
+
+  test('should return correct tokens for gpt-5.4-pro matches', () => {
+    expect(getModelMaxTokens('gpt-5.4-pro')).toBe(
+      maxTokensMap[EModelEndpoint.openAI]['gpt-5.4-pro'],
+    );
+    expect(getModelMaxTokens('openai/gpt-5.4-pro')).toBe(
+      maxTokensMap[EModelEndpoint.openAI]['gpt-5.4-pro'],
+    );
+  });
+
  test('should return correct tokens for Anthropic models', () => {
    const models = [
      'claude-2.1',
@@ -495,6 +514,8 @@ describe('getModelMaxTokens', () => {
      'gpt-5.1',
      'gpt-5.2',
      'gpt-5.3',
+      'gpt-5.4',
+      'gpt-5.4-pro',
      'gpt-5-mini',
      'gpt-5-nano',
      'gpt-5-pro',
@@ -804,6 +825,12 @@ describe('matchModelName', () => {
    expect(matchModelName('gpt-5.3-2025-03-01')).toBe('gpt-5.3');
  });

+  it('should return the closest matching key for gpt-5.4 matches', () => {
+    expect(matchModelName('openai/gpt-5.4')).toBe('gpt-5.4');
+    expect(matchModelName('gpt-5.4-thinking')).toBe('gpt-5.4');
+    expect(matchModelName('gpt-5.4-pro')).toBe('gpt-5.4-pro');
+  });
+
  it('should return the input model name if no match is found - Google models', () => {
    expect(matchModelName('unknown-google-model', EModelEndpoint.google)).toBe(
      'unknown-google-model',