Mirror of https://github.com/danny-avila/LibreChat.git, synced 2025-12-17 08:50:15 +01:00
📋 feat: Log Custom Config File and Add Known Model Limits to Custom Endpoint (#1657)
* refactor(custom): add all recognized models to maxTokensMap for custom endpoint
* feat(librechat.yaml): log the custom config file on initial load
* fix(OpenAIClient): pass endpointType/endpoint to `getModelMaxTokens` call
parent c470147ea2
commit f7f7f929a0
3 changed files with 27 additions and 21 deletions
@@ -131,7 +131,8 @@ class OpenAIClient extends BaseClient {
     const { isChatGptModel } = this;
     this.isUnofficialChatGptModel =
       model.startsWith('text-chat') || model.startsWith('text-davinci-002-render');
-    this.maxContextTokens = getModelMaxTokens(model) ?? 4095; // 1 less than maximum
+    this.maxContextTokens =
+      getModelMaxTokens(model, this.options.endpointType ?? this.options.endpoint) ?? 4095; // 1 less than maximum
 
     if (this.shouldSummarize) {
       this.maxContextTokens = Math.floor(this.maxContextTokens / 2);
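The fix threads the endpoint through to the token lookup: for a user-defined endpoint, `this.options.endpointType` is set and wins the nullish coalescing; for built-in endpoints it is unset and `this.options.endpoint` is used instead. A minimal sketch of what an endpoint-aware `getModelMaxTokens` can look like, assuming exact-then-substring matching against the per-endpoint tables (the matching strategy is an assumption, not confirmed by this diff):

// Sketch only: assumes maxTokensMap is keyed by endpoint and each table maps
// model-name keys (exact names or prefixes like 'mistral-') to token limits.
function getModelMaxTokens(modelName, endpoint = EModelEndpoint.openAI) {
  const tokensMap = maxTokensMap[endpoint];
  if (!tokensMap || typeof modelName !== 'string') {
    return undefined;
  }
  // Exact match first, e.g. 'claude-2.1'
  if (tokensMap[modelName]) {
    return tokensMap[modelName];
  }
  // Then a partial match, e.g. 'mistral-7b-instruct' hits the 'mistral-' key.
  // The map's own comment says key order matters for series like gpt-4/gpt-3,
  // so a real implementation must pick partial matches in a deliberate order.
  const key = Object.keys(tokensMap).find((k) => modelName.includes(k));
  return key ? tokensMap[key] : undefined;
}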
@@ -25,7 +25,8 @@ async function loadCustomConfig() {
     logger.error(`Invalid custom config file at ${configPath}`, result.error);
     return null;
   } else {
-    logger.info('Loaded custom config file');
+    logger.info('Loaded custom config file:');
+    logger.info(JSON.stringify(customConfig, null, 2));
   }
 
   if (customConfig.cache) {
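Logging the parsed file at startup makes a malformed or misread librechat.yaml visible immediately instead of failing silently later. A minimal self-contained sketch of the load-and-log flow; js-yaml, the file path, and the stand-in logger are assumptions, and only the two `logger.info` calls come from the diff:

const fs = require('fs');
const yaml = require('js-yaml'); // assumed YAML parser
const logger = { info: console.log, error: console.error }; // stand-in for the app logger

function loadCustomConfig(configPath = 'librechat.yaml') { // illustrative path
  let customConfig;
  try {
    customConfig = yaml.load(fs.readFileSync(configPath, 'utf8'));
  } catch (error) {
    logger.error(`Invalid custom config file at ${configPath}`, error);
    return null;
  }
  logger.info('Loaded custom config file:');
  // null replacer + 2-space indent pretty-prints nested endpoint settings
  logger.info(JSON.stringify(customConfig, null, 2));
  return customConfig;
}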
@@ -57,11 +57,7 @@ const openAIModels = {
   'mistral-': 31990, // -10 from max
 };
 
-// Order is important here: by model series and context size (gpt-4 then gpt-3, ascending)
-const maxTokensMap = {
-  [EModelEndpoint.openAI]: openAIModels,
-  [EModelEndpoint.custom]: openAIModels,
-  [EModelEndpoint.google]: {
+const googleModels = {
   /* Max I/O is combined so we subtract the amount from max response tokens for actual total */
   gemini: 32750, // -10 from max
   'text-bison-32k': 32758, // -10 from max
@@ -74,11 +70,19 @@ const maxTokensMap = {
   /* PaLM2, -5 from max: 8192 */
   'text-': 8187,
   'chat-': 8187,
-  },
-  [EModelEndpoint.anthropic]: {
+};
+
+const anthropicModels = {
   'claude-2.1': 200000,
   'claude-': 100000,
-  },
-};
+};
+
+// Order is important here: by model series and context size (gpt-4 then gpt-3, ascending)
+const maxTokensMap = {
+  [EModelEndpoint.openAI]: openAIModels,
+  [EModelEndpoint.custom]: { ...openAIModels, ...googleModels, ...anthropicModels },
+  [EModelEndpoint.google]: googleModels,
+  [EModelEndpoint.anthropic]: anthropicModels,
+};
 
 /**
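Splitting googleModels and anthropicModels into named tables is what lets [EModelEndpoint.custom] merge all three providers, so a user-defined endpoint resolves known limits regardless of which vendor's model it proxies. A hypothetical usage, assuming the lookup sketched above; the expected values are taken from the tables in this diff:

getModelMaxTokens('claude-2.1', EModelEndpoint.custom); // 200000, exact match in anthropicModels
getModelMaxTokens('mistral-7b-instruct', EModelEndpoint.custom); // 31990, via the 'mistral-' key from openAIModels
getModelMaxTokens('chat-bison', EModelEndpoint.custom); // 8187, via the 'chat-' key from googleModels

One design note: object spread gives later tables precedence on duplicate keys, so in { ...openAIModels, ...googleModels, ...anthropicModels } an Anthropic entry would shadow an identically named OpenAI one.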