2026-03-16 12:46:34 +01:00
743 changed files with 18060 additions and 84531 deletions
--- a/.env.example
+++ b/.env.example
@ -47,10 +47,6 @@ TRUST_PROXY=1
 # password policies.
 # MIN_PASSWORD_LENGTH=8

-# When enabled, the app will continue running after encountering uncaught exceptions
-# instead of exiting the process. Not recommended for production unless necessary.
-# CONTINUE_ON_UNCAUGHT_EXCEPTION=false
-
 #===============#
 # JSON Logging  #
 #===============#
@ -65,9 +61,6 @@ CONSOLE_JSON=false
 DEBUG_LOGGING=true
 DEBUG_CONSOLE=false

-# Enable memory diagnostics (logs heap/RSS snapshots every 60s, auto-enabled with --inspect)
-# MEM_DIAG=true
-
 #=============#
 # Permissions #
 #=============#
@ -94,16 +87,6 @@ NODE_MAX_OLD_SPACE_SIZE=6144

 # CONFIG_PATH="/alternative/path/to/librechat.yaml"

-#==================#
-# Langfuse Tracing #
-#==================#
-
-# Get Langfuse API keys for your project from the project settings page: https://cloud.langfuse.com
-
-# LANGFUSE_PUBLIC_KEY=
-# LANGFUSE_SECRET_KEY=
-# LANGFUSE_BASE_URL=
-
 #===================================================#
 #                     Endpoints                     #
 #===================================================#
@ -138,7 +121,7 @@ PROXY=
 #============#

 ANTHROPIC_API_KEY=user_provided
-# ANTHROPIC_MODELS=claude-sonnet-4-6,claude-opus-4-6,claude-opus-4-20250514,claude-sonnet-4-20250514,claude-3-7-sonnet-20250219,claude-3-5-sonnet-20241022,claude-3-5-haiku-20241022,claude-3-opus-20240229,claude-3-sonnet-20240229,claude-3-haiku-20240307
+# ANTHROPIC_MODELS=claude-opus-4-20250514,claude-sonnet-4-20250514,claude-3-7-sonnet-20250219,claude-3-5-sonnet-20241022,claude-3-5-haiku-20241022,claude-3-opus-20240229,claude-3-sonnet-20240229,claude-3-haiku-20240307
 # ANTHROPIC_REVERSE_PROXY=

 # Set to true to use Anthropic models through Google Vertex AI instead of direct API
@ -173,8 +156,7 @@ ANTHROPIC_API_KEY=user_provided
 # BEDROCK_AWS_SESSION_TOKEN=someSessionToken

 # Note: This example list is not meant to be exhaustive. If omitted, all known, supported model IDs will be included for you.
-# BEDROCK_AWS_MODELS=anthropic.claude-sonnet-4-6,anthropic.claude-opus-4-6-v1,anthropic.claude-3-5-sonnet-20240620-v1:0,meta.llama3-1-8b-instruct-v1:0
-# Cross-region inference model IDs: us.anthropic.claude-sonnet-4-6,us.anthropic.claude-opus-4-6-v1,global.anthropic.claude-opus-4-6-v1
+# BEDROCK_AWS_MODELS=anthropic.claude-3-5-sonnet-20240620-v1:0,meta.llama3-1-8b-instruct-v1:0

 # See all Bedrock model IDs here: https://docs.aws.amazon.com/bedrock/latest/userguide/model-ids.html#model-ids-arns

@ -196,10 +178,10 @@ GOOGLE_KEY=user_provided
 # GOOGLE_AUTH_HEADER=true

 # Gemini API (AI Studio)
-# GOOGLE_MODELS=gemini-3.1-pro-preview,gemini-3.1-pro-preview-customtools,gemini-3.1-flash-lite-preview,gemini-2.5-pro,gemini-2.5-flash,gemini-2.5-flash-lite,gemini-2.0-flash,gemini-2.0-flash-lite
+# GOOGLE_MODELS=gemini-2.5-pro,gemini-2.5-flash,gemini-2.5-flash-lite,gemini-2.0-flash,gemini-2.0-flash-lite

 # Vertex AI
-# GOOGLE_MODELS=gemini-3.1-pro-preview,gemini-3.1-pro-preview-customtools,gemini-3.1-flash-lite-preview,gemini-2.5-pro,gemini-2.5-flash,gemini-2.5-flash-lite,gemini-2.0-flash-001,gemini-2.0-flash-lite-001
+# GOOGLE_MODELS=gemini-2.5-pro,gemini-2.5-flash,gemini-2.5-flash-lite,gemini-2.0-flash-001,gemini-2.0-flash-lite-001

 # GOOGLE_TITLE_MODEL=gemini-2.0-flash-lite-001

@ -246,6 +228,10 @@ GOOGLE_KEY=user_provided
 # Option A: Use dedicated Gemini API key for image generation
 # GEMINI_API_KEY=your-gemini-api-key

+# Option B: Use Vertex AI (no API key needed, uses service account)
+# Set this to enable Vertex AI and allow tool without requiring API keys
+# GEMINI_VERTEX_ENABLED=true
+
 # Vertex AI model for image generation (defaults to gemini-2.5-flash-image)
 # GEMINI_IMAGE_MODEL=gemini-2.5-flash-image

@ -513,9 +499,6 @@ OPENID_ADMIN_ROLE_TOKEN_KIND=
 OPENID_USERNAME_CLAIM=
 # Set to determine which user info property returned from OpenID Provider to store as the User's name
 OPENID_NAME_CLAIM=
-# Set to determine which user info claim to use as the email/identifier for user matching (e.g., "upn" for Entra ID)
-# When not set, defaults to: email -> preferred_username -> upn
-OPENID_EMAIL_CLAIM=
 # Optional audience parameter for OpenID authorization requests
 OPENID_AUDIENCE=

@ -660,9 +643,6 @@ AWS_ACCESS_KEY_ID=
 AWS_SECRET_ACCESS_KEY=
 AWS_REGION=
 AWS_BUCKET_NAME=
-# Required for path-style S3-compatible providers (MinIO, Hetzner, Backblaze B2, etc.)
-# that don't support virtual-hosted-style URLs (bucket.endpoint). Not needed for AWS S3.
-# AWS_FORCE_PATH_STYLE=false

 #========================#
 # Azure Blob Storage     #
@ -677,8 +657,7 @@ AZURE_CONTAINER_NAME=files
 #========================#

 ALLOW_SHARED_LINKS=true
-# Allows unauthenticated access to shared links. Defaults to false (auth required) if not set.
-ALLOW_SHARED_LINKS_PUBLIC=false
+ALLOW_SHARED_LINKS_PUBLIC=true

 #==============================#
 # Static File Cache Control    #
@ -758,10 +737,8 @@ HELP_AND_FAQ_URL=https://librechat.ai
 # REDIS_PING_INTERVAL=300

 # Force specific cache namespaces to use in-memory storage even when Redis is enabled
-# Comma-separated list of CacheKeys
-# Defaults to CONFIG_STORE,APP_CONFIG so YAML-derived config stays per-container (safe for blue/green deployments)
-# Set to empty string to force all namespaces through Redis: FORCED_IN_MEMORY_CACHE_NAMESPACES=
-# FORCED_IN_MEMORY_CACHE_NAMESPACES=CONFIG_STORE,APP_CONFIG
+# Comma-separated list of CacheKeys (e.g., ROLES,MESSAGES)
+# FORCED_IN_MEMORY_CACHE_NAMESPACES=ROLES,MESSAGES

 # Leader Election Configuration (for multi-instance deployments with Redis)
 # Duration in seconds that the leader lease is valid before it expires (default: 25)
@ -850,24 +827,3 @@ OPENWEATHER_API_KEY=
 # Skip code challenge method validation (e.g., for AWS Cognito that supports S256 but doesn't advertise it)
 # When set to true, forces S256 code challenge even if not advertised in .well-known/openid-configuration
 # MCP_SKIP_CODE_CHALLENGE_CHECK=false
-
-# Circuit breaker: max connect/disconnect cycles before tripping (per server)
-# MCP_CB_MAX_CYCLES=7
-
-# Circuit breaker: sliding window (ms) for counting cycles
-# MCP_CB_CYCLE_WINDOW_MS=45000
-
-# Circuit breaker: cooldown (ms) after the cycle breaker trips
-# MCP_CB_CYCLE_COOLDOWN_MS=15000
-
-# Circuit breaker: max consecutive failed connection rounds before backoff
-# MCP_CB_MAX_FAILED_ROUNDS=3
-
-# Circuit breaker: sliding window (ms) for counting failed rounds
-# MCP_CB_FAILED_WINDOW_MS=120000
-
-# Circuit breaker: base backoff (ms) after failed round threshold is reached
-# MCP_CB_BASE_BACKOFF_MS=30000
-
-# Circuit breaker: max backoff cap (ms) for exponential backoff
-# MCP_CB_MAX_BACKOFF_MS=300000
--- a/.github/CONTRIBUTING.md
+++ b/.github/CONTRIBUTING.md
@ -26,14 +26,18 @@ Project maintainers have the right and responsibility to remove, edit, or reject

 ## 1. Development Setup

-1. Use Node.js v20.19.0+ or ^22.12.0 or >= 23.0.0.
-2. Run `npm run smart-reinstall` to install dependencies (uses Turborepo). Use `npm run reinstall` for a clean install, or `npm ci` for a fresh lockfile-based install.
-3. Build all compiled code: `npm run build`.
-4. Setup and run unit tests:
+1. Use Node.JS 20.x.
+2. Install typescript globally: `npm i -g typescript`.
+3. Run `npm ci` to install dependencies.
+4. Build the data provider: `npm run build:data-provider`.
+5. Build data schemas: `npm run build:data-schemas`.
+6. Build API methods: `npm run build:api`.
+7. Setup and run unit tests:
    - Copy `.env.test`: `cp api/test/.env.test.example api/test/.env.test`.
    - Run backend unit tests: `npm run test:api`.
    - Run frontend unit tests: `npm run test:client`.
-5. Setup and run integration tests:
+8. Setup and run integration tests:
+    - Build client: `cd client && npm run build`.
    - Create `.env`: `cp .env.example .env`.
    - Install [MongoDB Community Edition](https://www.mongodb.com/docs/manual/administration/install-community/), ensure that `mongosh` connects to your local instance.
    - Run: `npx install playwright`, then `npx playwright install`.
@ -44,11 +48,11 @@ Project maintainers have the right and responsibility to remove, edit, or reject
 ## 2. Development Notes

 1. Before starting work, make sure your main branch has the latest commits with `npm run update`.
-2. Run linting command to find errors: `npm run lint`. Alternatively, ensure husky pre-commit checks are functioning.
+3. Run linting command to find errors: `npm run lint`. Alternatively, ensure husky pre-commit checks are functioning.
 3. After your changes, reinstall packages in your current branch using `npm run reinstall` and ensure everything still works. 
    - Restart the ESLint server ("ESLint: Restart ESLint Server" in VS Code command bar) and your IDE after reinstalling or updating.
 4. Clear web app localStorage and cookies before and after changes.
-5. To check for introduced errors, build all compiled code: `npm run build`.
+5. For frontend changes, compile typescript before and after changes to check for introduced errors: `cd client && npm run build`.
 6. Run backend unit tests: `npm run test:api`.
 7. Run frontend unit tests: `npm run test:client`.
 8. Run integration tests: `npm run e2e`.
@ -114,45 +118,50 @@ Apply the following naming conventions to branches, labels, and other Git-relate
 - **JS/TS:** Directories and file names: Descriptive and camelCase. First letter uppercased for React files (e.g., `helperFunction.ts, ReactComponent.tsx`).
 - **Docs:** Directories and file names: Descriptive and snake_case (e.g., `config_files.md`).

-## 7. Coding Standards
-
-For detailed coding conventions, workspace boundaries, and architecture guidance, refer to the [`AGENTS.md`](../AGENTS.md) file at the project root. It covers code style, type safety, import ordering, iteration/performance expectations, frontend rules, testing, and development commands.
-
-## 8. TypeScript Conversion
+## 7. TypeScript Conversion

 1. **Original State**: The project was initially developed entirely in JavaScript (JS).

-2. **Frontend**: Fully transitioned to TypeScript.
+2. **Frontend Transition**:
+   - We are in the process of transitioning the frontend from JS to TypeScript (TS).
+   - The transition is nearing completion.
+   - This conversion is feasible due to React's capability to intermix JS and TS prior to code compilation. It's standard practice to compile/bundle the code in such scenarios.

-3. **Backend**:
-   - The legacy Express.js server remains in `/api` as JavaScript.
-   - All new backend code is written in TypeScript under `/packages/api`, which is compiled and consumed by `/api`.
-   - Shared database logic lives in `/packages/data-schemas` (TypeScript).
-   - Shared frontend/backend API types and services live in `/packages/data-provider` (TypeScript).
-   - Minimize direct changes to `/api`; prefer adding TypeScript code to `/packages/api` and importing it.
+3. **Backend Considerations**:
+   - Transitioning the backend to TypeScript would be a more intricate process, especially for an established Express.js server.
   
-## 9. Module Import Conventions
+   - **Options for Transition**:
+      - **Single Phase Overhaul**: This involves converting the entire backend to TypeScript in one go. It's the most straightforward approach but can be disruptive, especially for larger codebases.
      
-Imports are organized into three sections (in order):
+      - **Incremental Transition**: Convert parts of the backend progressively. This can be done by:
+         - Maintaining a separate directory for TypeScript files.
+         - Gradually migrating and testing individual modules or routes.
+         - Using a build tool like `tsc` to compile TypeScript files independently until the entire transition is complete.
         
-1. **Package imports** — sorted from shortest to longest line length.
-   - `react` is always the first import.
-   - Multi-line (stacked) imports count their total character length across all lines for sorting.
+   - **Compilation Considerations**: 
+      - Introducing a compilation step for the server is an option. This would involve using tools like `ts-node` for development and `tsc` for production builds.
+      - However, this is not a conventional approach for Express.js servers and could introduce added complexity, especially in terms of build and deployment processes.
      
-2. **`import type` imports** — sorted from longest to shortest line length.
-   - Package type imports come first, then local type imports.
-   - Line length sorting resets between the package and local sub-groups.
+   - **Current Stance**: At present, this backend transition is of lower priority and might not be pursued.

-3. **Local/project imports** — sorted from longest to shortest line length.
-   - Multi-line (stacked) imports count their total character length across all lines for sorting.
-   - Imports with alias `~` are treated the same as relative imports with respect to line length.
+## 8. Module Import Conventions

- Consolidate value imports from the same module as much as possible.
- Always use standalone `import type { ... }` for type imports; never use inline `type` keyword inside value imports (e.g., `import { Foo, type Bar }` is wrong).
+- `npm` packages first, 
+     - from longest line (top) to shortest (bottom)
+
+- Followed by typescript types (pertains to data-provider and client workspaces)
+     - longest line (top) to shortest (bottom)
+     - types from package come first
+
+- Lastly, local imports
+     - longest line (top) to shortest (bottom)
+     - imports with alias `~` treated the same as relative import with respect to line length

 **Note:** ESLint will automatically enforce these import conventions when you run `npm run lint --fix` or through pre-commit hooks.

-For the full set of coding standards, see [`AGENTS.md`](../AGENTS.md).
+---
+
+Please ensure that you adapt this summary to fit the specific context and nuances of your project.

 ---

--- a/.github/workflows/backend-review.yml
+++ b/.github/workflows/backend-review.yml
@ -9,159 +9,11 @@ on:
    paths:
      - 'api/**'
      - 'packages/**'
-
-env:
-  NODE_ENV: CI
-  NODE_OPTIONS: '--max-old-space-size=${{ secrets.NODE_MAX_OLD_SPACE_SIZE || 6144 }}'
-
 jobs:
-  build:
-    name: Build packages
+  tests_Backend:
+    name: Run Backend unit tests
+    timeout-minutes: 60
    runs-on: ubuntu-latest
-    timeout-minutes: 15
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Restore data-provider build cache
-        id: cache-data-provider
-        uses: actions/cache@v4
-        with:
-          path: packages/data-provider/dist
-          key: build-data-provider-${{ runner.os }}-${{ hashFiles('packages/data-provider/src/**', 'packages/data-provider/tsconfig*.json', 'packages/data-provider/rollup.config.js', 'packages/data-provider/package.json') }}
-
-      - name: Build data-provider
-        if: steps.cache-data-provider.outputs.cache-hit != 'true'
-        run: npm run build:data-provider
-
-      - name: Restore data-schemas build cache
-        id: cache-data-schemas
-        uses: actions/cache@v4
-        with:
-          path: packages/data-schemas/dist
-          key: build-data-schemas-${{ runner.os }}-${{ hashFiles('packages/data-schemas/src/**', 'packages/data-schemas/tsconfig*.json', 'packages/data-schemas/rollup.config.js', 'packages/data-schemas/package.json', 'packages/data-provider/src/**', 'packages/data-provider/tsconfig*.json', 'packages/data-provider/rollup.config.js', 'packages/data-provider/package.json') }}
-
-      - name: Build data-schemas
-        if: steps.cache-data-schemas.outputs.cache-hit != 'true'
-        run: npm run build:data-schemas
-
-      - name: Restore api build cache
-        id: cache-api
-        uses: actions/cache@v4
-        with:
-          path: packages/api/dist
-          key: build-api-${{ runner.os }}-${{ hashFiles('packages/api/src/**', 'packages/api/tsconfig*.json', 'packages/api/server-rollup.config.js', 'packages/api/package.json', 'packages/data-provider/src/**', 'packages/data-provider/tsconfig*.json', 'packages/data-provider/rollup.config.js', 'packages/data-provider/package.json', 'packages/data-schemas/src/**', 'packages/data-schemas/tsconfig*.json', 'packages/data-schemas/rollup.config.js', 'packages/data-schemas/package.json') }}
-
-      - name: Build api
-        if: steps.cache-api.outputs.cache-hit != 'true'
-        run: npm run build:api
-
-      - name: Upload data-provider build
-        uses: actions/upload-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-          retention-days: 2
-
-      - name: Upload data-schemas build
-        uses: actions/upload-artifact@v4
-        with:
-          name: build-data-schemas
-          path: packages/data-schemas/dist
-          retention-days: 2
-
-      - name: Upload api build
-        uses: actions/upload-artifact@v4
-        with:
-          name: build-api
-          path: packages/api/dist
-          retention-days: 2
-
-  circular-deps:
-    name: Circular dependency checks
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 10
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download data-schemas build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-schemas
-          path: packages/data-schemas/dist
-
-      - name: Rebuild @librechat/api and check for circular dependencies
-        run: |
-          output=$(npm run build:api 2>&1)
-          echo "$output"
-          if echo "$output" | grep -q "Circular depend"; then
-            echo "Error: Circular dependency detected in @librechat/api!"
-            exit 1
-          fi
-
-      - name: Detect circular dependencies in rollup
-        working-directory: ./packages/data-provider
-        run: |
-          output=$(npm run rollup:api)
-          echo "$output"
-          if echo "$output" | grep -q "Circular dependency"; then
-            echo "Error: Circular dependency detected!"
-            exit 1
-          fi
-
-  test-api:
-    name: 'Tests: api'
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 15
    env:
      MONGO_URI: ${{ secrets.MONGO_URI }}
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
@ -171,187 +23,54 @@ jobs:
      BAN_VIOLATIONS: ${{ secrets.BAN_VIOLATIONS }}
      BAN_DURATION: ${{ secrets.BAN_DURATION }}
      BAN_INTERVAL: ${{ secrets.BAN_INTERVAL }}
+      NODE_ENV: CI
+      NODE_OPTIONS: '--max-old-space-size=${{ secrets.NODE_MAX_OLD_SPACE_SIZE || 6144 }}'
    steps:
      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
+      - name: Use Node.js 20.x
        uses: actions/setup-node@v4
        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
+          node-version: 20
+          cache: 'npm'

      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
        run: npm ci

-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
+      - name: Install Data Provider Package
+        run: npm run build:data-provider

-      - name: Download data-schemas build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-schemas
-          path: packages/data-schemas/dist
+      - name: Install Data Schemas Package
+        run: npm run build:data-schemas

-      - name: Download api build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-api
-          path: packages/api/dist
+      - name: Install API Package
+        run: npm run build:api

      - name: Create empty auth.json file
        run: |
          mkdir -p api/data
          echo '{}' > api/data/auth.json

+      - name: Check for Circular dependency in rollup
+        working-directory: ./packages/data-provider
+        run: |
+          output=$(npm run rollup:api)
+          echo "$output"
+          if echo "$output" | grep -q "Circular dependency"; then
+            echo "Error: Circular dependency detected!"
+            exit 1
+          fi
+
      - name: Prepare .env.test file
        run: cp api/test/.env.test.example api/test/.env.test

      - name: Run unit tests
        run: cd api && npm run test:ci

-  test-data-provider:
-    name: 'Tests: data-provider'
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 10
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Run unit tests
+      - name: Run librechat-data-provider unit tests
        run: cd packages/data-provider && npm run test:ci

-  test-data-schemas:
-    name: 'Tests: data-schemas'
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 10
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download data-schemas build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-schemas
-          path: packages/data-schemas/dist
-
-      - name: Run unit tests
+      - name: Run @librechat/data-schemas unit tests
        run: cd packages/data-schemas && npm run test:ci

-  test-packages-api:
-    name: 'Tests: @librechat/api'
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 10
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            api/node_modules
-            packages/api/node_modules
-            packages/data-provider/node_modules
-            packages/data-schemas/node_modules
-          key: node-modules-backend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download data-schemas build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-schemas
-          path: packages/data-schemas/dist
-
-      - name: Download api build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-api
-          path: packages/api/dist
-
-      - name: Run unit tests
+      - name: Run @librechat/api unit tests
        run: cd packages/api && npm run test:ci
--- a/.github/workflows/frontend-review.yml
+++ b/.github/workflows/frontend-review.yml
@ -11,200 +11,51 @@ on:
      - 'client/**'
      - 'packages/data-provider/**'

-env:
-  NODE_OPTIONS: '--max-old-space-size=${{ secrets.NODE_MAX_OLD_SPACE_SIZE || 6144 }}'
-
 jobs:
-  build:
-    name: Build packages
+  tests_frontend_ubuntu:
+    name: Run frontend unit tests on Ubuntu
+    timeout-minutes: 60
    runs-on: ubuntu-latest
-    timeout-minutes: 15
+    env:
+      NODE_OPTIONS: '--max-old-space-size=${{ secrets.NODE_MAX_OLD_SPACE_SIZE || 6144 }}'
    steps:
      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
+      - name: Use Node.js 20.x
        uses: actions/setup-node@v4
        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            client/node_modules
-            packages/client/node_modules
-            packages/data-provider/node_modules
-          key: node-modules-frontend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
+          node-version: 20
+          cache: 'npm'

      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
        run: npm ci

-      - name: Restore data-provider build cache
-        id: cache-data-provider
-        uses: actions/cache@v4
-        with:
-          path: packages/data-provider/dist
-          key: build-data-provider-${{ runner.os }}-${{ hashFiles('packages/data-provider/src/**', 'packages/data-provider/tsconfig*.json', 'packages/data-provider/rollup.config.js', 'packages/data-provider/package.json') }}
-
-      - name: Build data-provider
-        if: steps.cache-data-provider.outputs.cache-hit != 'true'
-        run: npm run build:data-provider
-
-      - name: Restore client-package build cache
-        id: cache-client-package
-        uses: actions/cache@v4
-        with:
-          path: packages/client/dist
-          key: build-client-package-${{ runner.os }}-${{ hashFiles('packages/client/src/**', 'packages/client/tsconfig*.json', 'packages/client/rollup.config.js', 'packages/client/package.json', 'packages/data-provider/src/**', 'packages/data-provider/tsconfig*.json', 'packages/data-provider/rollup.config.js', 'packages/data-provider/package.json') }}
-
-      - name: Build client-package
-        if: steps.cache-client-package.outputs.cache-hit != 'true'
-        run: npm run build:client-package
-
-      - name: Upload data-provider build
-        uses: actions/upload-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-          retention-days: 2
-
-      - name: Upload client-package build
-        uses: actions/upload-artifact@v4
-        with:
-          name: build-client-package
-          path: packages/client/dist
-          retention-days: 2
-
-  test-ubuntu:
-    name: 'Tests: Ubuntu'
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 15
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            client/node_modules
-            packages/client/node_modules
-            packages/data-provider/node_modules
-          key: node-modules-frontend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download client-package build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-client-package
-          path: packages/client/dist
+      - name: Build Client
+        run: npm run frontend:ci

      - name: Run unit tests
        run: npm run test:ci --verbose
        working-directory: client

-  test-windows:
-    name: 'Tests: Windows'
-    needs: build
+  tests_frontend_windows:
+    name: Run frontend unit tests on Windows
+    timeout-minutes: 60
    runs-on: windows-latest
-    timeout-minutes: 20
+    env:
+      NODE_OPTIONS: '--max-old-space-size=${{ secrets.NODE_MAX_OLD_SPACE_SIZE || 6144 }}'
    steps:
      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
+      - name: Use Node.js 20.x
        uses: actions/setup-node@v4
        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            client/node_modules
-            packages/client/node_modules
-            packages/data-provider/node_modules
-          key: node-modules-frontend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
+          node-version: 20
+          cache: 'npm'

      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
        run: npm ci

-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download client-package build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-client-package
-          path: packages/client/dist
+      - name: Build Client
+        run: npm run frontend:ci

      - name: Run unit tests
        run: npm run test:ci --verbose
        working-directory: client
-
-  build-verify:
-    name: Vite build verification
-    needs: build
-    runs-on: ubuntu-latest
-    timeout-minutes: 15
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Use Node.js 20.19
-        uses: actions/setup-node@v4
-        with:
-          node-version: '20.19'
-
-      - name: Restore node_modules cache
-        id: cache-node-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            client/node_modules
-            packages/client/node_modules
-            packages/data-provider/node_modules
-          key: node-modules-frontend-${{ runner.os }}-20.19-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-node-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Download data-provider build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-data-provider
-          path: packages/data-provider/dist
-
-      - name: Download client-package build
-        uses: actions/download-artifact@v4
-        with:
-          name: build-client-package
-          path: packages/client/dist
-
-      - name: Build client
-        run: cd client && npm run build:ci
--- a/.gitignore
+++ b/.gitignore
@ -15,7 +15,6 @@ pids

 # CI/CD data
 test-image*
-dump.rdb

 # Directory for instrumented libs generated by jscoverage/JSCover
 lib-cov
@ -30,9 +29,6 @@ coverage
 config/translations/stores/*
 client/src/localization/languages/*_missing_keys.json

-# Turborepo
-.turbo
-
 # Compiled Dirs (http://nodejs.org/api/addons.html)
 build/
 dist/
--- a/AGENTS.md
+++ b/AGENTS.md
@ -1,166 +0,0 @@
-# LibreChat
-
-## Project Overview
-
-LibreChat is a monorepo with the following key workspaces:
-
-| Workspace | Language | Side | Dependency | Purpose |
-|---|---|---|---|---|
-| `/api` | JS (legacy) | Backend | `packages/api`, `packages/data-schemas`, `packages/data-provider`, `@librechat/agents` | Express server — minimize changes here |
-| `/packages/api` | **TypeScript** | Backend | `packages/data-schemas`, `packages/data-provider` | New backend code lives here (TS only, consumed by `/api`) |
-| `/packages/data-schemas` | TypeScript | Backend | `packages/data-provider` | Database models/schemas, shareable across backend projects |
-| `/packages/data-provider` | TypeScript | Shared | — | Shared API types, endpoints, data-service — used by both frontend and backend |
-| `/client` | TypeScript/React | Frontend | `packages/data-provider`, `packages/client` | Frontend SPA |
-| `/packages/client` | TypeScript | Frontend | `packages/data-provider` | Shared frontend utilities |
-
-The source code for `@librechat/agents` (major backend dependency, same team) is at `/home/danny/agentus`.
-
---
-
-## Workspace Boundaries
-
- **All new backend code must be TypeScript** in `/packages/api`.
- Keep `/api` changes to the absolute minimum (thin JS wrappers calling into `/packages/api`).
- Database-specific shared logic goes in `/packages/data-schemas`.
- Frontend/backend shared API logic (endpoints, types, data-service) goes in `/packages/data-provider`.
- Build data-provider from project root: `npm run build:data-provider`.
-
---
-
-## Code Style
-
-### Structure and Clarity
-
- **Never-nesting**: early returns, flat code, minimal indentation. Break complex operations into well-named helpers.
- **Functional first**: pure functions, immutable data, `map`/`filter`/`reduce` over imperative loops. Only reach for OOP when it clearly improves domain modeling or state encapsulation.
- **No dynamic imports** unless absolutely necessary.
-
-### DRY
-
- Extract repeated logic into utility functions.
- Reusable hooks / higher-order components for UI patterns.
- Parameterized helpers instead of near-duplicate functions.
- Constants for repeated values; configuration objects over duplicated init code.
- Shared validators, centralized error handling, single source of truth for business rules.
- Shared typing system with interfaces/types extending common base definitions.
- Abstraction layers for external API interactions.
-
-### Iteration and Performance
-
- **Minimize looping** — especially over shared data structures like message arrays, which are iterated frequently throughout the codebase. Every additional pass adds up at scale.
- Consolidate sequential O(n) operations into a single pass whenever possible; never loop over the same collection twice if the work can be combined.
- Choose data structures that reduce the need to iterate (e.g., `Map`/`Set` for lookups instead of `Array.find`/`Array.includes`).
- Avoid unnecessary object creation; consider space-time tradeoffs.
- Prevent memory leaks: careful with closures, dispose resources/event listeners, no circular references.
-
-### Type Safety
-
- **Never use `any`**. Explicit types for all parameters, return values, and variables.
- **Limit `unknown`** — avoid `unknown`, `Record<string, unknown>`, and `as unknown as T` assertions. A `Record<string, unknown>` almost always signals a missing explicit type definition.
- **Don't duplicate types** — before defining a new type, check whether it already exists in the project (especially `packages/data-provider`). Reuse and extend existing types rather than creating redundant definitions.
- Use union types, generics, and interfaces appropriately.
- All TypeScript and ESLint warnings/errors must be addressed — do not leave unresolved diagnostics.
-
-### Comments and Documentation
-
- Write self-documenting code; no inline comments narrating what code does.
- JSDoc only for complex/non-obvious logic or intellisense on public APIs.
- Single-line JSDoc for brief docs, multi-line for complex cases.
- Avoid standalone `//` comments unless absolutely necessary.
-
-### Import Order
-
-Imports are organized into three sections:
-
-1. **Package imports** — sorted shortest to longest line length (`react` always first).
-2. **`import type` imports** — sorted longest to shortest (package types first, then local types; length resets between sub-groups).
-3. **Local/project imports** — sorted longest to shortest.
-
-Multi-line imports count total character length across all lines. Consolidate value imports from the same module. Always use standalone `import type { ... }` — never inline `type` inside value imports.
-
-### JS/TS Loop Preferences
-
- **Limit looping as much as possible.** Prefer single-pass transformations and avoid re-iterating the same data.
- `for (let i = 0; ...)` for performance-critical or index-dependent operations.
- `for...of` for simple array iteration.
- `for...in` only for object property enumeration.
-
---
-
-## Frontend Rules (`client/src/**/*`)
-
-### Localization
-
- All user-facing text must use `useLocalize()`.
- Only update English keys in `client/src/locales/en/translation.json` (other languages are automated externally).
- Semantic key prefixes: `com_ui_`, `com_assistants_`, etc.
-
-### Components
-
- TypeScript for all React components with proper type imports.
- Semantic HTML with ARIA labels (`role`, `aria-label`) for accessibility.
- Group related components in feature directories (e.g., `SidePanel/Memories/`).
- Use index files for clean exports.
-
-### Data Management
-
- Feature hooks: `client/src/data-provider/[Feature]/queries.ts` → `[Feature]/index.ts` → `client/src/data-provider/index.ts`.
- React Query (`@tanstack/react-query`) for all API interactions; proper query invalidation on mutations.
- QueryKeys and MutationKeys in `packages/data-provider/src/keys.ts`.
-
-### Data-Provider Integration
-
- Endpoints: `packages/data-provider/src/api-endpoints.ts`
- Data service: `packages/data-provider/src/data-service.ts`
- Types: `packages/data-provider/src/types/queries.ts`
- Use `encodeURIComponent` for dynamic URL parameters.
-
-### Performance
-
- Prioritize memory and speed efficiency at scale.
- Cursor pagination for large datasets.
- Proper dependency arrays to avoid unnecessary re-renders.
- Leverage React Query caching and background refetching.
-
---
-
-## Development Commands
-
-| Command | Purpose |
-|---|---|
-| `npm run smart-reinstall` | Install deps (if lockfile changed) + build via Turborepo |
-| `npm run reinstall` | Clean install — wipe `node_modules` and reinstall from scratch |
-| `npm run backend` | Start the backend server |
-| `npm run backend:dev` | Start backend with file watching (development) |
-| `npm run build` | Build all compiled code via Turborepo (parallel, cached) |
-| `npm run frontend` | Build all compiled code sequentially (legacy fallback) |
-| `npm run frontend:dev` | Start frontend dev server with HMR (port 3090, requires backend running) |
-| `npm run build:data-provider` | Rebuild `packages/data-provider` after changes |
-
- Node.js: v20.19.0+ or ^22.12.0 or >= 23.0.0
- Database: MongoDB
- Backend runs on `http://localhost:3080/`; frontend dev server on `http://localhost:3090/`
-
---
-
-## Testing
-
- Framework: **Jest**, run per-workspace.
- Run tests from their workspace directory: `cd api && npx jest <pattern>`, `cd packages/api && npx jest <pattern>`, etc.
- Frontend tests: `__tests__` directories alongside components; use `test/layout-test-utils` for rendering.
- Cover loading, success, and error states for UI/data flows.
-
-### Philosophy
-
- **Real logic over mocks.** Exercise actual code paths with real dependencies. Mocking is a last resort.
- **Spies over mocks.** Assert that real functions are called with expected arguments and frequency without replacing underlying logic.
- **MongoDB**: use `mongodb-memory-server` for a real in-memory MongoDB instance. Test actual queries and schema validation, not mocked DB calls.
- **MCP**: use real `@modelcontextprotocol/sdk` exports for servers, transports, and tool definitions. Mirror real scenarios, don't stub SDK internals.
- Only mock what you cannot control: external HTTP APIs, rate-limited services, non-deterministic system calls.
- Heavy mocking is a code smell, not a testing strategy.
-
---
-
-## Formatting
-
-Fix all formatting lint errors (trailing spaces, tabs, newlines, indentation) using auto-fix when available. All TypeScript/ESLint warnings and errors **must** be resolved.
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -0,0 +1,236 @@
+# Changelog
+
+All notable changes to this project will be documented in this file.
+
+
+
+
+
+
+## [Unreleased]
+
+### ✨ New Features
+
+- ✨ feat: implement search parameter updates by **@mawburn** in [#7151](https://github.com/danny-avila/LibreChat/pull/7151)
+- 🎏 feat: Add MCP support for Streamable HTTP Transport by **@benverhees** in [#7353](https://github.com/danny-avila/LibreChat/pull/7353)
+- 🔒 feat: Add Content Security Policy using Helmet middleware by **@rubentalstra** in [#7377](https://github.com/danny-avila/LibreChat/pull/7377)
+- ✨ feat: Add Normalization for MCP Server Names by **@danny-avila** in [#7421](https://github.com/danny-avila/LibreChat/pull/7421)
+- 📊 feat: Improve Helm Chart by **@hofq** in [#3638](https://github.com/danny-avila/LibreChat/pull/3638)
+- 🦾 feat: Claude-4 Support by **@danny-avila** in [#7509](https://github.com/danny-avila/LibreChat/pull/7509)
+- 🪨 feat: Bedrock Support for Claude-4 Reasoning by **@danny-avila** in [#7517](https://github.com/danny-avila/LibreChat/pull/7517)
+
+### 🌍 Internationalization
+
+- 🌍 i18n: Add `Danish` and `Czech` and `Catalan` localization support by **@rubentalstra** in [#7373](https://github.com/danny-avila/LibreChat/pull/7373)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#7375](https://github.com/danny-avila/LibreChat/pull/7375)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#7468](https://github.com/danny-avila/LibreChat/pull/7468)
+
+### 🔧 Fixes
+
+- 💬 fix: update aria-label for accessibility in ConvoLink component by **@berry-13** in [#7320](https://github.com/danny-avila/LibreChat/pull/7320)
+- 🔑 fix: use `apiKey` instead of `openAIApiKey` in OpenAI-like Config by **@danny-avila** in [#7337](https://github.com/danny-avila/LibreChat/pull/7337)
+- 🔄 fix: update navigation logic in `useFocusChatEffect` to ensure correct search parameters are used by **@mawburn** in [#7340](https://github.com/danny-avila/LibreChat/pull/7340)
+- 🔄 fix: Improve MCP Connection Cleanup by **@danny-avila** in [#7400](https://github.com/danny-avila/LibreChat/pull/7400)
+- 🛡️ fix: Preset and Validation Logic for URL Query Params by **@danny-avila** in [#7407](https://github.com/danny-avila/LibreChat/pull/7407)
+- 🌘 fix: artifact of preview text is illegible in dark mode by **@nhtruong** in [#7405](https://github.com/danny-avila/LibreChat/pull/7405)
+- 🛡️ fix: Temporarily Remove CSP until Configurable by **@danny-avila** in [#7419](https://github.com/danny-avila/LibreChat/pull/7419)
+- 💽 fix: Exclude index page `/` from static cache settings by **@sbruel** in [#7382](https://github.com/danny-avila/LibreChat/pull/7382)
+
+### ⚙️ Other Changes
+
+- 📜 docs: CHANGELOG for release v0.7.8 by **@github-actions[bot]** in [#7290](https://github.com/danny-avila/LibreChat/pull/7290)
+- 📦 chore: Update API Package Dependencies by **@danny-avila** in [#7359](https://github.com/danny-avila/LibreChat/pull/7359)
+- 📜 docs: Unreleased Changelog by **@github-actions[bot]** in [#7321](https://github.com/danny-avila/LibreChat/pull/7321)
+- 📜 docs: Unreleased Changelog by **@github-actions[bot]** in [#7434](https://github.com/danny-avila/LibreChat/pull/7434)
+- 🛡️ chore: `multer` v2.0.0 for CVE-2025-47935 and CVE-2025-47944 by **@danny-avila** in [#7454](https://github.com/danny-avila/LibreChat/pull/7454)
+- 📂 refactor: Improve `FileAttachment` & File Form Deletion by **@danny-avila** in [#7471](https://github.com/danny-avila/LibreChat/pull/7471)
+- 📊 chore: Remove Old Helm Chart by **@hofq** in [#7512](https://github.com/danny-avila/LibreChat/pull/7512)
+- 🪖 chore: bump helm app version to v0.7.8 by **@austin-barrington** in [#7524](https://github.com/danny-avila/LibreChat/pull/7524)
+
+
+
+---
+## [v0.7.8] - 
+
+Changes from v0.7.8-rc1 to v0.7.8.
+
+### ✨ New Features
+
+- ✨ feat: Enhance form submission for touch screens by **@berry-13** in [#7198](https://github.com/danny-avila/LibreChat/pull/7198)
+- 🔍 feat: Additional Tavily API Tool Parameters by **@glowforge-opensource** in [#7232](https://github.com/danny-avila/LibreChat/pull/7232)
+- 🐋 feat: Add python to Dockerfile for increased MCP compatibility by **@technicalpickles** in [#7270](https://github.com/danny-avila/LibreChat/pull/7270)
+
+### 🔧 Fixes
+
+- 🔧 fix: Google Gemma Support & OpenAI Reasoning Instructions by **@danny-avila** in [#7196](https://github.com/danny-avila/LibreChat/pull/7196)
+- 🛠️ fix: Conversation Navigation State by **@danny-avila** in [#7210](https://github.com/danny-avila/LibreChat/pull/7210)
+- 🔄 fix: o-Series Model Regex for System Messages by **@danny-avila** in [#7245](https://github.com/danny-avila/LibreChat/pull/7245)
+- 🔖 fix: Custom Headers for Initial MCP SSE Connection by **@danny-avila** in [#7246](https://github.com/danny-avila/LibreChat/pull/7246)
+- 🛡️ fix: Deep Clone `MCPOptions` for User MCP Connections by **@danny-avila** in [#7247](https://github.com/danny-avila/LibreChat/pull/7247)
+- 🔄 fix: URL Param Race Condition and File Draft Persistence by **@danny-avila** in [#7257](https://github.com/danny-avila/LibreChat/pull/7257)
+- 🔄 fix: Assistants Endpoint & Minor Issues by **@danny-avila** in [#7274](https://github.com/danny-avila/LibreChat/pull/7274)
+- 🔄 fix: Ollama Think Tag Edge Case with Tools by **@danny-avila** in [#7275](https://github.com/danny-avila/LibreChat/pull/7275)
+
+### ⚙️ Other Changes
+
+- 📜 docs: CHANGELOG for release v0.7.8-rc1 by **@github-actions[bot]** in [#7153](https://github.com/danny-avila/LibreChat/pull/7153)
+- 🔄 refactor: Artifact Visibility Management by **@danny-avila** in [#7181](https://github.com/danny-avila/LibreChat/pull/7181)
+- 📦 chore: Bump Package Security by **@danny-avila** in [#7183](https://github.com/danny-avila/LibreChat/pull/7183)
+- 🌿 refactor: Unmount Fork Popover on Hide for Better Performance by **@danny-avila** in [#7189](https://github.com/danny-avila/LibreChat/pull/7189)
+- 🧰 chore: ESLint configuration to enforce Prettier formatting rules by **@mawburn** in [#7186](https://github.com/danny-avila/LibreChat/pull/7186)
+- 🎨 style: Improve KaTeX Rendering for LaTeX Equations by **@andresgit** in [#7223](https://github.com/danny-avila/LibreChat/pull/7223)
+- 📝 docs: Update `.env.example` Google models by **@marlonka** in [#7254](https://github.com/danny-avila/LibreChat/pull/7254)
+- 💬 refactor: MCP Chat Visibility Option, Google Rates, Remove OpenAPI Plugins by **@danny-avila** in [#7286](https://github.com/danny-avila/LibreChat/pull/7286)
+- 📜 docs: Unreleased Changelog by **@github-actions[bot]** in [#7214](https://github.com/danny-avila/LibreChat/pull/7214)
+
+
+
+[See full release details][release-v0.7.8]
+
+[release-v0.7.8]: https://github.com/danny-avila/LibreChat/releases/tag/v0.7.8
+
+---
+## [v0.7.8-rc1] - 
+
+Changes from v0.7.7 to v0.7.8-rc1.
+
+### ✨ New Features
+
+- 🔍 feat: Mistral OCR API / Upload Files as Text by **@danny-avila** in [#6274](https://github.com/danny-avila/LibreChat/pull/6274)
+- 🤖 feat: Support OpenAI Web Search models by **@danny-avila** in [#6313](https://github.com/danny-avila/LibreChat/pull/6313)
+- 🔗 feat: Agent Chain (Mixture-of-Agents) by **@danny-avila** in [#6374](https://github.com/danny-avila/LibreChat/pull/6374)
+- ⌛ feat: `initTimeout` for Slow Starting MCP Servers by **@perweij** in [#6383](https://github.com/danny-avila/LibreChat/pull/6383)
+- 🚀 feat: `S3` Integration for File handling and Image uploads by **@rubentalstra** in [#6142](https://github.com/danny-avila/LibreChat/pull/6142)
+- 🔒feat: Enable OpenID Auto-Redirect by **@leondape** in [#6066](https://github.com/danny-avila/LibreChat/pull/6066)
+- 🚀 feat: Integrate `Azure Blob Storage` for file handling and image uploads by **@rubentalstra** in [#6153](https://github.com/danny-avila/LibreChat/pull/6153)
+- 🚀 feat: Add support for custom `AWS` endpoint in `S3` by **@rubentalstra** in [#6431](https://github.com/danny-avila/LibreChat/pull/6431)
+- 🚀 feat: Add support for LDAP STARTTLS in LDAP authentication by **@rubentalstra** in [#6438](https://github.com/danny-avila/LibreChat/pull/6438)
+- 🚀 feat: Refactor schema exports and update package version to 0.0.4 by **@rubentalstra** in [#6455](https://github.com/danny-avila/LibreChat/pull/6455)
+- 🔼 feat: Add Auto Submit For URL Query Params by **@mjaverto** in [#6440](https://github.com/danny-avila/LibreChat/pull/6440)
+- 🛠 feat: Enhance Redis Integration, Rate Limiters & Log Headers by **@danny-avila** in [#6462](https://github.com/danny-avila/LibreChat/pull/6462)
+- 💵 feat: Add Automatic Balance Refill by **@rubentalstra** in [#6452](https://github.com/danny-avila/LibreChat/pull/6452)
+- 🗣️ feat: add support for gpt-4o-transcribe models by **@berry-13** in [#6483](https://github.com/danny-avila/LibreChat/pull/6483)
+- 🎨 feat: UI Refresh for Enhanced UX by **@berry-13** in [#6346](https://github.com/danny-avila/LibreChat/pull/6346)
+- 🌍 feat: Add support for Hungarian language localization by **@rubentalstra** in [#6508](https://github.com/danny-avila/LibreChat/pull/6508)
+- 🚀 feat: Add Gemini 2.5 Token/Context Values, Increase Max Possible Output to 64k by **@danny-avila** in [#6563](https://github.com/danny-avila/LibreChat/pull/6563)
+- 🚀 feat: Enhance MCP Connections For Multi-User Support by **@danny-avila** in [#6610](https://github.com/danny-avila/LibreChat/pull/6610)
+- 🚀 feat: Enhance S3 URL Expiry with Refresh; fix: S3 File Deletion by **@danny-avila** in [#6647](https://github.com/danny-avila/LibreChat/pull/6647)
+- 🚀 feat: enhance UI components and refactor settings by **@berry-13** in [#6625](https://github.com/danny-avila/LibreChat/pull/6625)
+- 💬 feat: move TemporaryChat to the Header by **@berry-13** in [#6646](https://github.com/danny-avila/LibreChat/pull/6646)
+- 🚀 feat: Use Model Specs + Specific Endpoints, Limit Providers for Agents by **@danny-avila** in [#6650](https://github.com/danny-avila/LibreChat/pull/6650)
+- 🪙 feat: Sync Balance Config on Login by **@danny-avila** in [#6671](https://github.com/danny-avila/LibreChat/pull/6671)
+- 🔦 feat: MCP Support for Non-Agent Endpoints by **@danny-avila** in [#6775](https://github.com/danny-avila/LibreChat/pull/6775)
+- 🗃️ feat: Code Interpreter File Persistence between Sessions by **@danny-avila** in [#6790](https://github.com/danny-avila/LibreChat/pull/6790)
+- 🖥️ feat: Code Interpreter API for Non-Agent Endpoints by **@danny-avila** in [#6803](https://github.com/danny-avila/LibreChat/pull/6803)
+- ⚡ feat: Self-hosted Artifacts Static Bundler URL by **@danny-avila** in [#6827](https://github.com/danny-avila/LibreChat/pull/6827)
+- 🐳 feat: Add Jemalloc and UV to Docker Builds by **@danny-avila** in [#6836](https://github.com/danny-avila/LibreChat/pull/6836)
+- 🤖 feat: GPT-4.1 by **@danny-avila** in [#6880](https://github.com/danny-avila/LibreChat/pull/6880)
+- 👋 feat: remove Edge TTS by **@berry-13** in [#6885](https://github.com/danny-avila/LibreChat/pull/6885)
+- feat: nav optimization  by **@berry-13** in [#5785](https://github.com/danny-avila/LibreChat/pull/5785)
+- 🗺️ feat: Add Parameter Location Mapping for OpenAPI actions by **@peeeteeer** in [#6858](https://github.com/danny-avila/LibreChat/pull/6858)
+- 🤖 feat: Support `o4-mini` and `o3` Models by **@danny-avila** in [#6928](https://github.com/danny-avila/LibreChat/pull/6928)
+- 🎨 feat: OpenAI Image Tools (GPT-Image-1) by **@danny-avila** in [#7079](https://github.com/danny-avila/LibreChat/pull/7079)
+- 🗓️ feat: Add Special Variables for Prompts & Agents, Prompt UI Improvements by **@danny-avila** in [#7123](https://github.com/danny-avila/LibreChat/pull/7123)
+
+### 🌍 Internationalization
+
+- 🌍 i18n: Add Thai Language Support and Update Translations by **@rubentalstra** in [#6219](https://github.com/danny-avila/LibreChat/pull/6219)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6220](https://github.com/danny-avila/LibreChat/pull/6220)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6240](https://github.com/danny-avila/LibreChat/pull/6240)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6241](https://github.com/danny-avila/LibreChat/pull/6241)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6277](https://github.com/danny-avila/LibreChat/pull/6277)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6414](https://github.com/danny-avila/LibreChat/pull/6414)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6505](https://github.com/danny-avila/LibreChat/pull/6505)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6530](https://github.com/danny-avila/LibreChat/pull/6530)
+- 🌍 i18n: Add Persian Localization Support by **@rubentalstra** in [#6669](https://github.com/danny-avila/LibreChat/pull/6669)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#6667](https://github.com/danny-avila/LibreChat/pull/6667)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#7126](https://github.com/danny-avila/LibreChat/pull/7126)
+- 🌍 i18n: Update translation.json with latest translations by **@github-actions[bot]** in [#7148](https://github.com/danny-avila/LibreChat/pull/7148)
+
+### 👐 Accessibility
+
+- 🎨 a11y: Update Model Spec Description Text by **@berry-13** in [#6294](https://github.com/danny-avila/LibreChat/pull/6294)
+- 🗑️ a11y: Add Accessible Name to Button for File Attachment Removal by **@kangabell** in [#6709](https://github.com/danny-avila/LibreChat/pull/6709)
+- ⌨️ a11y: enhance accessibility & visual consistency by **@berry-13** in [#6866](https://github.com/danny-avila/LibreChat/pull/6866)
+- 🙌 a11y: Searchbar/Conversations List Focus by **@danny-avila** in [#7096](https://github.com/danny-avila/LibreChat/pull/7096)
+- 👐 a11y: Improve Fork and SplitText Accessibility by **@danny-avila** in [#7147](https://github.com/danny-avila/LibreChat/pull/7147)
+
+### 🔧 Fixes
+
+- 🐛 fix: Avatar Type Definitions in Agent/Assistant Schemas by **@danny-avila** in [#6235](https://github.com/danny-avila/LibreChat/pull/6235)
+- 🔧 fix: MeiliSearch Field Error and Patch Incorrect Import by #6210 by **@rubentalstra** in [#6245](https://github.com/danny-avila/LibreChat/pull/6245)
+- 🔏 fix: Enhance Two-Factor Authentication by **@rubentalstra** in [#6247](https://github.com/danny-avila/LibreChat/pull/6247)
+- 🐛 fix: Await saveMessage in abortMiddleware to ensure proper execution by **@sh4shii** in [#6248](https://github.com/danny-avila/LibreChat/pull/6248)
+- 🔧 fix: Axios Proxy Usage And Bump `mongoose` by **@danny-avila** in [#6298](https://github.com/danny-avila/LibreChat/pull/6298)
+- 🔧 fix: comment out MCP servers to resolve service run issues by **@KunalScriptz** in [#6316](https://github.com/danny-avila/LibreChat/pull/6316)
+- 🔧 fix: Update Token Calculations and Mapping, MCP `env` Initialization by **@danny-avila** in [#6406](https://github.com/danny-avila/LibreChat/pull/6406)
+- 🐞 fix: Agent "Resend" Message Attachments + Source Icon Styling by **@danny-avila** in [#6408](https://github.com/danny-avila/LibreChat/pull/6408)
+- 🐛 fix: Prevent Crash on Duplicate Message ID by **@Odrec** in [#6392](https://github.com/danny-avila/LibreChat/pull/6392)
+- 🔐 fix: Invalid Key Length in 2FA Encryption by **@rubentalstra** in [#6432](https://github.com/danny-avila/LibreChat/pull/6432)
+- 🏗️ fix: Fix Agents Token Spend Race Conditions, Expand Test Coverage by **@danny-avila** in [#6480](https://github.com/danny-avila/LibreChat/pull/6480)
+- 🔃 fix: Draft Clearing, Claude Titles, Remove Default Vision Max Tokens by **@danny-avila** in [#6501](https://github.com/danny-avila/LibreChat/pull/6501)
+- 🔧 fix: Update username reference to use user.name in greeting display by **@rubentalstra** in [#6534](https://github.com/danny-avila/LibreChat/pull/6534)
+- 🔧 fix: S3 Download Stream with Key Extraction and Blob Storage Encoding for Vision by **@danny-avila** in [#6557](https://github.com/danny-avila/LibreChat/pull/6557)
+- 🔧 fix: Mistral type strictness for `usage` & update token values/windows by **@danny-avila** in [#6562](https://github.com/danny-avila/LibreChat/pull/6562)
+- 🔧 fix: Consolidate Text Parsing and TTS Edge Initialization by **@danny-avila** in [#6582](https://github.com/danny-avila/LibreChat/pull/6582)
+- 🔧 fix: Ensure continuation in image processing on base64 encoding from Blob Storage by **@danny-avila** in [#6619](https://github.com/danny-avila/LibreChat/pull/6619)
+- ✉️ fix: Fallback For User Name In Email Templates by **@danny-avila** in [#6620](https://github.com/danny-avila/LibreChat/pull/6620)
+- 🔧 fix: Azure Blob Integration and File Source References by **@rubentalstra** in [#6575](https://github.com/danny-avila/LibreChat/pull/6575)
+- 🐛 fix: Safeguard against undefined addedEndpoints by **@wipash** in [#6654](https://github.com/danny-avila/LibreChat/pull/6654)
+- 🤖 fix: Gemini 2.5 Vision Support by **@danny-avila** in [#6663](https://github.com/danny-avila/LibreChat/pull/6663)
+- 🔄 fix: Avatar & Error Handling Enhancements by **@danny-avila** in [#6687](https://github.com/danny-avila/LibreChat/pull/6687)
+- 🔧 fix: Chat Middleware, Zod Conversion, Auto-Save and S3 URL Refresh by **@danny-avila** in [#6720](https://github.com/danny-avila/LibreChat/pull/6720)
+- 🔧 fix: Agent Capability Checks & DocumentDB Compatibility for Agent Resource Removal by **@danny-avila** in [#6726](https://github.com/danny-avila/LibreChat/pull/6726)
+- 🔄 fix: Improve audio MIME type detection and handling by **@berry-13** in [#6707](https://github.com/danny-avila/LibreChat/pull/6707)
+- 🪺 fix: Update Role Handling due to New Schema Shape by **@danny-avila** in [#6774](https://github.com/danny-avila/LibreChat/pull/6774)
+- 🗨️ fix: Show ModelSpec Greeting by **@berry-13** in [#6770](https://github.com/danny-avila/LibreChat/pull/6770)
+- 🔧 fix: Keyv and Proxy Issues, and More Memory Optimizations by **@danny-avila** in [#6867](https://github.com/danny-avila/LibreChat/pull/6867)
+- ✨ fix: Implement dynamic text sizing for greeting and name display by **@berry-13** in [#6833](https://github.com/danny-avila/LibreChat/pull/6833)
+- 📝 fix: Mistral OCR Image Support and Azure Agent Titles by **@danny-avila** in [#6901](https://github.com/danny-avila/LibreChat/pull/6901)
+- 📢 fix: Invalid `engineTTS` and Conversation State on Navigation by **@berry-13** in [#6904](https://github.com/danny-avila/LibreChat/pull/6904)
+- 🛠️ fix: Improve Accessibility and Display of Conversation Menu by **@danny-avila** in [#6913](https://github.com/danny-avila/LibreChat/pull/6913)
+- 🔧 fix: Agent Resource Form, Convo Menu Style, Ensure Draft Clears on Submission by **@danny-avila** in [#6925](https://github.com/danny-avila/LibreChat/pull/6925)
+- 🔀 fix: MCP Improvements, Auto-Save Drafts, Artifact Markup by **@danny-avila** in [#7040](https://github.com/danny-avila/LibreChat/pull/7040)
+- 🐋 fix: Improve Deepseek Compatbility by **@danny-avila** in [#7132](https://github.com/danny-avila/LibreChat/pull/7132)
+- 🐙 fix: Add Redis Ping Interval to Prevent Connection Drops by **@peeeteeer** in [#7127](https://github.com/danny-avila/LibreChat/pull/7127)
+
+### ⚙️ Other Changes
+
+- 📦 refactor: Move DB Models to `@librechat/data-schemas` by **@rubentalstra** in [#6210](https://github.com/danny-avila/LibreChat/pull/6210)
+- 📦 chore: Patch `axios` to address CVE-2025-27152 by **@danny-avila** in [#6222](https://github.com/danny-avila/LibreChat/pull/6222)
+- ⚠️ refactor: Use Error Content Part Instead Of Throwing Error for Agents by **@danny-avila** in [#6262](https://github.com/danny-avila/LibreChat/pull/6262)
+- 🏃‍♂️ refactor: Improve Agent Run Context & Misc. Changes by **@danny-avila** in [#6448](https://github.com/danny-avila/LibreChat/pull/6448)
+- 📝 docs: librechat.example.yaml by **@ineiti** in [#6442](https://github.com/danny-avila/LibreChat/pull/6442)
+- 🏃‍♂️ refactor: More Agent Context Improvements during Run by **@danny-avila** in [#6477](https://github.com/danny-avila/LibreChat/pull/6477)
+- 🔃 refactor: Allow streaming for `o1` models by **@danny-avila** in [#6509](https://github.com/danny-avila/LibreChat/pull/6509)
+- 🔧 chore: `Vite` Plugin Upgrades & Config Optimizations by **@rubentalstra** in [#6547](https://github.com/danny-avila/LibreChat/pull/6547)
+- 🔧 refactor: Consolidate Logging, Model Selection & Actions Optimizations, Minor Fixes by **@danny-avila** in [#6553](https://github.com/danny-avila/LibreChat/pull/6553)
+- 🎨 style: Address Minor UI Refresh Issues by **@berry-13** in [#6552](https://github.com/danny-avila/LibreChat/pull/6552)
+- 🔧 refactor: Enhance Model & Endpoint Configurations with Global Indicators 🌍 by **@berry-13** in [#6578](https://github.com/danny-avila/LibreChat/pull/6578)
+- 💬 style: Chat UI, Greeting, and Message adjustments by **@berry-13** in [#6612](https://github.com/danny-avila/LibreChat/pull/6612)
+- ⚡ refactor: DocumentDB Compatibility for Balance Updates by **@danny-avila** in [#6673](https://github.com/danny-avila/LibreChat/pull/6673)
+- 🧹 chore: Update ESLint rules for React hooks by **@rubentalstra** in [#6685](https://github.com/danny-avila/LibreChat/pull/6685)
+- 🪙 chore: Update Gemini Pricing by **@RedwindA** in [#6731](https://github.com/danny-avila/LibreChat/pull/6731)
+- 🪺 refactor: Nest Permission fields for Roles by **@rubentalstra** in [#6487](https://github.com/danny-avila/LibreChat/pull/6487)
+- 📦 chore: Update `caniuse-lite` dependency to version 1.0.30001706 by **@rubentalstra** in [#6482](https://github.com/danny-avila/LibreChat/pull/6482)
+- ⚙️ refactor: OAuth Flow Signal, Type Safety, Tool Progress & Updated Packages by **@danny-avila** in [#6752](https://github.com/danny-avila/LibreChat/pull/6752)
+- 📦 chore: bump vite from 6.2.3 to 6.2.5 by **@dependabot[bot]** in [#6745](https://github.com/danny-avila/LibreChat/pull/6745)
+- 💾 chore: Enhance Local Storage Handling and Update MCP SDK by **@danny-avila** in [#6809](https://github.com/danny-avila/LibreChat/pull/6809)
+- 🤖 refactor: Improve Agents Memory Usage, Bump Keyv, Grok 3 by **@danny-avila** in [#6850](https://github.com/danny-avila/LibreChat/pull/6850)
+- 💾 refactor: Enhance Memory In Image Encodings & Client Disposal by **@danny-avila** in [#6852](https://github.com/danny-avila/LibreChat/pull/6852)
+- 🔁 refactor: Token Event Handler and Standardize `maxTokens` Key by **@danny-avila** in [#6886](https://github.com/danny-avila/LibreChat/pull/6886)
+- 🔍 refactor: Search & Message Retrieval by **@berry-13** in [#6903](https://github.com/danny-avila/LibreChat/pull/6903)
+- 🎨 style: standardize dropdown styling & fix z-Index layering by **@berry-13** in [#6939](https://github.com/danny-avila/LibreChat/pull/6939)
+- 📙 docs: CONTRIBUTING.md by **@dblock** in [#6831](https://github.com/danny-avila/LibreChat/pull/6831)
+- 🧭 refactor: Modernize Nav/Header by **@danny-avila** in [#7094](https://github.com/danny-avila/LibreChat/pull/7094)
+- 🪶 refactor: Chat Input Focus for Conversation Navigations & ChatForm Optimizations by **@danny-avila** in [#7100](https://github.com/danny-avila/LibreChat/pull/7100)
+- 🔃 refactor: Streamline Navigation, Message Loading UX by **@danny-avila** in [#7118](https://github.com/danny-avila/LibreChat/pull/7118)
+- 📜 docs: Unreleased changelog by **@github-actions[bot]** in [#6265](https://github.com/danny-avila/LibreChat/pull/6265)
+
+
+
+[See full release details][release-v0.7.8-rc1]
+
+[release-v0.7.8-rc1]: https://github.com/danny-avila/LibreChat/releases/tag/v0.7.8-rc1
+
+---
--- a/CLAUDE.md
+++ b/CLAUDE.md
@ -1 +0,0 @@
-AGENTS.md
--- a/2
+++ b/2
@ -1,4 +1,4 @@
-# v0.8.3
+# v0.8.2

 # Base node image
 FROM node:20-alpine AS node
--- a/Dockerfile.multi
+++ b/Dockerfile.multi
@ -1,5 +1,5 @@
 # Dockerfile.multi
-# v0.8.3
+# v0.8.2

 # Set configurable max-old-space-size with default
 ARG NODE_MAX_OLD_SPACE_SIZE=6144
--- a/README.md
+++ b/README.md
@ -27,8 +27,8 @@
 </p>

 <p align="center">
-<a href="https://railway.com/deploy/b5k2mn?referralCode=HI9hWz">
-  <img src="https://railway.com/button.svg" alt="Deploy on Railway" height="30">
+<a href="https://railway.app/template/b5k2mn?referralCode=HI9hWz">
+  <img src="https://railway.app/button.svg" alt="Deploy on Railway" height="30">
 </a>
 <a href="https://zeabur.com/templates/0X2ZY8">
  <img src="https://zeabur.com/button.svg" alt="Deploy on Zeabur" height="30"/>
--- a/api/app/clients/BaseClient.js
+++ b/api/app/clients/BaseClient.js
@ -4,7 +4,6 @@ const { logger } = require('@librechat/data-schemas');
 const {
  countTokens,
  getBalanceConfig,
-  buildMessageFiles,
  extractFileContext,
  encodeAndFormatAudios,
  encodeAndFormatVideos,
@ -21,7 +20,6 @@ const {
  isAgentsEndpoint,
  isEphemeralAgentId,
  supportsBalanceCheck,
-  isBedrockDocumentType,
 } = require('librechat-data-provider');
 const {
  updateMessage,
@ -124,9 +122,7 @@ class BaseClient {
   * @returns {number}
   */
  getTokenCountForResponse(responseMessage) {
-    logger.debug('[BaseClient] `recordTokenUsage` not implemented.', {
-      messageId: responseMessage?.messageId,
-    });
+    logger.debug('[BaseClient] `recordTokenUsage` not implemented.', responseMessage);
  }

  /**
@ -137,14 +133,12 @@ class BaseClient {
   * @param {AppConfig['balance']} [balance]
   * @param {number} promptTokens
   * @param {number} completionTokens
-   * @param {string} [messageId]
   * @returns {Promise<void>}
   */
-  async recordTokenUsage({ model, balance, promptTokens, completionTokens, messageId }) {
+  async recordTokenUsage({ model, balance, promptTokens, completionTokens }) {
    logger.debug('[BaseClient] `recordTokenUsage` not implemented.', {
      model,
      balance,
-      messageId,
      promptTokens,
      completionTokens,
    });
@ -665,27 +659,16 @@ class BaseClient {
    );

    if (tokenCountMap) {
+      logger.debug('[BaseClient] tokenCountMap', tokenCountMap);
      if (tokenCountMap[userMessage.messageId]) {
        userMessage.tokenCount = tokenCountMap[userMessage.messageId];
-        logger.debug('[BaseClient] userMessage', {
-          messageId: userMessage.messageId,
-          tokenCount: userMessage.tokenCount,
-          conversationId: userMessage.conversationId,
-        });
+        logger.debug('[BaseClient] userMessage', userMessage);
      }

      this.handleTokenCountMap(tokenCountMap);
    }

    if (!isEdited && !this.skipSaveUserMessage) {
-      const reqFiles = this.options.req?.body?.files;
-      if (reqFiles && Array.isArray(this.options.attachments)) {
-        const files = buildMessageFiles(reqFiles, this.options.attachments);
-        if (files.length > 0) {
-          userMessage.files = files;
-        }
-        delete userMessage.image_urls;
-      }
      userMessagePromise = this.saveMessageToDatabase(userMessage, saveOptions, user);
      this.savedMessageIds.add(userMessage.messageId);
      if (typeof opts?.getReqData === 'function') {
@ -797,18 +780,9 @@ class BaseClient {
          promptTokens,
          completionTokens,
          balance: balanceConfig,
-          /** Note: When using agents, responseMessage.model is the agent ID, not the model */
-          model: this.model,
-          messageId: this.responseMessageId,
+          model: responseMessage.model,
        });
      }
-
-      logger.debug('[BaseClient] Response token usage', {
-        messageId: responseMessage.messageId,
-        model: responseMessage.model,
-        promptTokens,
-        completionTokens,
-      });
    }

    if (userMessagePromise) {
@ -1326,9 +1300,6 @@ class BaseClient {

    const allFiles = [];

-    const provider = this.options.agent?.provider ?? this.options.endpoint;
-    const isBedrock = provider === EModelEndpoint.bedrock;
-
    for (const file of attachments) {
      /** @type {FileSources} */
      const source = file.source ?? FileSources.local;
@ -1346,9 +1317,6 @@ class BaseClient {
      } else if (file.type === 'application/pdf') {
        categorizedAttachments.documents.push(file);
        allFiles.push(file);
-      } else if (isBedrock && isBedrockDocumentType(file.type)) {
-        categorizedAttachments.documents.push(file);
-        allFiles.push(file);
      } else if (file.type.startsWith('video/')) {
        categorizedAttachments.videos.push(file);
        allFiles.push(file);
--- a/api/app/clients/specs/BaseClient.test.js
+++ b/api/app/clients/specs/BaseClient.test.js
@ -41,9 +41,9 @@ jest.mock('~/models', () => ({
 const { getConvo, saveConvo } = require('~/models');

 jest.mock('@librechat/agents', () => {
-  const actual = jest.requireActual('@librechat/agents');
+  const { Providers } = jest.requireActual('@librechat/agents');
  return {
-    ...actual,
+    Providers,
    ChatOpenAI: jest.fn().mockImplementation(() => {
      return {};
    }),
@ -821,56 +821,6 @@ describe('BaseClient', () => {
    });
  });

-  describe('recordTokenUsage model assignment', () => {
-    test('should pass this.model to recordTokenUsage, not the agent ID from responseMessage.model', async () => {
-      const actualModel = 'claude-opus-4-5';
-      const agentId = 'agent_p5Z_IU6EIxBoqn1BoqLBp';
-
-      TestClient.model = actualModel;
-      TestClient.options.endpoint = 'agents';
-      TestClient.options.agent = { id: agentId };
-
-      TestClient.getTokenCountForResponse = jest.fn().mockReturnValue(50);
-      TestClient.recordTokenUsage = jest.fn().mockResolvedValue(undefined);
-      TestClient.buildMessages.mockReturnValue({
-        prompt: [],
-        tokenCountMap: { res: 50 },
-      });
-
-      await TestClient.sendMessage('Hello', {});
-
-      expect(TestClient.recordTokenUsage).toHaveBeenCalledWith(
-        expect.objectContaining({
-          model: actualModel,
-        }),
-      );
-
-      const callArgs = TestClient.recordTokenUsage.mock.calls[0][0];
-      expect(callArgs.model).not.toBe(agentId);
-    });
-
-    test('should pass this.model even when this.model differs from modelOptions.model', async () => {
-      const instanceModel = 'gpt-4o';
-      TestClient.model = instanceModel;
-      TestClient.modelOptions = { model: 'gpt-4o-mini' };
-
-      TestClient.getTokenCountForResponse = jest.fn().mockReturnValue(50);
-      TestClient.recordTokenUsage = jest.fn().mockResolvedValue(undefined);
-      TestClient.buildMessages.mockReturnValue({
-        prompt: [],
-        tokenCountMap: { res: 50 },
-      });
-
-      await TestClient.sendMessage('Hello', {});
-
-      expect(TestClient.recordTokenUsage).toHaveBeenCalledWith(
-        expect.objectContaining({
-          model: instanceModel,
-        }),
-      );
-    });
-  });
-
  describe('getMessagesWithinTokenLimit with instructions', () => {
    test('should always include instructions when present', async () => {
      TestClient.maxContextTokens = 50;
@ -978,123 +928,4 @@ describe('BaseClient', () => {
      expect(result.remainingContextTokens).toBe(2); // 25 - 20 - 3(assistant label)
    });
  });
-
-  describe('sendMessage file population', () => {
-    const attachment = {
-      file_id: 'file-abc',
-      filename: 'image.png',
-      filepath: '/uploads/image.png',
-      type: 'image/png',
-      bytes: 1024,
-      object: 'file',
-      user: 'user-1',
-      embedded: false,
-      usage: 0,
-      text: 'large ocr blob that should be stripped',
-      _id: 'mongo-id-1',
-    };
-
-    beforeEach(() => {
-      TestClient.options.req = { body: { files: [{ file_id: 'file-abc' }] } };
-      TestClient.options.attachments = [attachment];
-    });
-
-    test('populates userMessage.files before saveMessageToDatabase is called', async () => {
-      TestClient.saveMessageToDatabase = jest.fn().mockImplementation((msg) => {
-        return Promise.resolve({ message: msg });
-      });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave).toBeDefined();
-      expect(userSave[0].files).toBeDefined();
-      expect(userSave[0].files).toHaveLength(1);
-      expect(userSave[0].files[0].file_id).toBe('file-abc');
-    });
-
-    test('strips text and _id from files before saving', async () => {
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave[0].files[0].text).toBeUndefined();
-      expect(userSave[0].files[0]._id).toBeUndefined();
-      expect(userSave[0].files[0].filename).toBe('image.png');
-    });
-
-    test('deletes image_urls from userMessage when files are present', async () => {
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-      TestClient.options.attachments = [
-        { ...attachment, image_urls: ['data:image/png;base64,...'] },
-      ];
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave[0].image_urls).toBeUndefined();
-    });
-
-    test('does not set files when no attachments match request file IDs', async () => {
-      TestClient.options.req = { body: { files: [{ file_id: 'file-nomatch' }] } };
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave[0].files).toBeUndefined();
-    });
-
-    test('skips file population when attachments is not an array (Promise case)', async () => {
-      TestClient.options.attachments = Promise.resolve([attachment]);
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave[0].files).toBeUndefined();
-    });
-
-    test('skips file population when skipSaveUserMessage is true', async () => {
-      TestClient.skipSaveUserMessage = true;
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg?.isCreatedByUser,
-      );
-      expect(userSave).toBeUndefined();
-    });
-
-    test('ignores file_id: undefined entries in req.body.files (no set poisoning)', async () => {
-      TestClient.options.req = {
-        body: { files: [{ file_id: undefined }, { file_id: 'file-abc' }] },
-      };
-      TestClient.options.attachments = [
-        { ...attachment, file_id: undefined },
-        { ...attachment, file_id: 'file-abc' },
-      ];
-      TestClient.saveMessageToDatabase = jest.fn().mockResolvedValue({ message: {} });
-
-      await TestClient.sendMessage('Hello');
-
-      const userSave = TestClient.saveMessageToDatabase.mock.calls.find(
-        ([msg]) => msg.isCreatedByUser,
-      );
-      expect(userSave[0].files).toHaveLength(1);
-      expect(userSave[0].files[0].file_id).toBe('file-abc');
-    });
-  });
 });
--- a/api/app/clients/tools/manifest.json
+++ b/api/app/clients/tools/manifest.json
@ -16,7 +16,7 @@
    "name": "Google",
    "pluginKey": "google",
    "description": "Use Google Search to find information about the weather, news, sports, and more.",
-    "icon": "assets/google-search.svg",
+    "icon": "https://i.imgur.com/SMmVkNB.png",
    "authConfig": [
      {
        "authField": "GOOGLE_CSE_ID",
@ -57,11 +57,24 @@
      }
    ]
  },
+  {
+    "name": "Browser",
+    "pluginKey": "web-browser",
+    "description": "Scrape and summarize webpage data",
+    "icon": "assets/web-browser.svg",
+    "authConfig": [
+      {
+        "authField": "OPENAI_API_KEY",
+        "label": "OpenAI API Key",
+        "description": "Browser makes use of OpenAI embeddings"
+      }
+    ]
+  },
  {
    "name": "DALL-E-3",
    "pluginKey": "dalle",
    "description": "[DALL-E-3] Create realistic images and art from a description in natural language",
-    "icon": "assets/openai.svg",
+    "icon": "https://i.imgur.com/u2TzXzH.png",
    "authConfig": [
      {
        "authField": "DALLE3_API_KEY||DALLE_API_KEY",
@ -74,7 +87,7 @@
    "name": "Tavily Search",
    "pluginKey": "tavily_search_results_json",
    "description": "Tavily Search is a robust search API tailored for LLM Agents. It seamlessly integrates with diverse data sources to ensure a superior, relevant search experience.",
-    "icon": "assets/tavily.svg",
+    "icon": "https://tavily.com/favicon.ico",
    "authConfig": [
      {
        "authField": "TAVILY_API_KEY",
@ -87,14 +100,14 @@
    "name": "Calculator",
    "pluginKey": "calculator",
    "description": "Perform simple and complex mathematical calculations.",
-    "icon": "assets/calculator.svg",
+    "icon": "https://i.imgur.com/RHsSG5h.png",
    "authConfig": []
  },
  {
    "name": "Stable Diffusion",
    "pluginKey": "stable-diffusion",
    "description": "Generate photo-realistic images given any text input.",
-    "icon": "assets/stability-ai.svg",
+    "icon": "https://i.imgur.com/Yr466dp.png",
    "authConfig": [
      {
        "authField": "SD_WEBUI_URL",
@ -107,7 +120,7 @@
    "name": "Azure AI Search",
    "pluginKey": "azure-ai-search",
    "description": "Use Azure AI Search to find information",
-    "icon": "assets/azure-ai-search.svg",
+    "icon": "https://i.imgur.com/E7crPze.png",
    "authConfig": [
      {
        "authField": "AZURE_AI_SEARCH_SERVICE_ENDPOINT",
@ -143,7 +156,7 @@
    "name": "Flux",
    "pluginKey": "flux",
    "description": "Generate images using text with the Flux API.",
-    "icon": "assets/bfl-ai.svg",
+    "icon": "https://blackforestlabs.ai/wp-content/uploads/2024/07/bfl_logo_retraced_blk.png",
    "isAuthRequired": "true",
    "authConfig": [
      {
@ -156,14 +169,14 @@
  {
    "name": "Gemini Image Tools",
    "pluginKey": "gemini_image_gen",
+    "toolkit": true,
    "description": "Generate high-quality images using Google's Gemini Image Models. Supports Gemini API or Vertex AI.",
    "icon": "assets/gemini_image_gen.svg",
    "authConfig": [
      {
-        "authField": "GEMINI_API_KEY||GOOGLE_KEY||GOOGLE_SERVICE_KEY_FILE",
-        "label": "Gemini API Key (optional)",
-        "description": "Your Google Gemini API Key from <a href='https://aistudio.google.com/app/apikey' target='_blank'>Google AI Studio</a>. Leave blank to use Vertex AI with a service account (GOOGLE_SERVICE_KEY_FILE or api/data/auth.json).",
-        "optional": true
+        "authField": "GEMINI_API_KEY||GOOGLE_KEY||GEMINI_VERTEX_ENABLED",
+        "label": "Gemini API Key (Optional if Vertex AI is configured)",
+        "description": "Your Google Gemini API Key from <a href='https://aistudio.google.com/app/apikey' target='_blank'>Google AI Studio</a>. Leave blank if using Vertex AI with service account."
      }
    ]
  }
--- a/api/app/clients/tools/structured/AzureAISearch.js
+++ b/api/app/clients/tools/structured/AzureAISearch.js
@ -1,28 +1,14 @@
+const { z } = require('zod');
 const { Tool } = require('@langchain/core/tools');
 const { logger } = require('@librechat/data-schemas');
 const { SearchClient, AzureKeyCredential } = require('@azure/search-documents');

-const azureAISearchJsonSchema = {
-  type: 'object',
-  properties: {
-    query: {
-      type: 'string',
-      description: 'Search word or phrase to Azure AI Search',
-    },
-  },
-  required: ['query'],
-};
-
 class AzureAISearch extends Tool {
  // Constants for default values
  static DEFAULT_API_VERSION = '2023-11-01';
  static DEFAULT_QUERY_TYPE = 'simple';
  static DEFAULT_TOP = 5;

-  static get jsonSchema() {
-    return azureAISearchJsonSchema;
-  }
-
  // Helper function for initializing properties
  _initializeField(field, envVar, defaultValue) {
    return field || process.env[envVar] || defaultValue;
@ -36,7 +22,10 @@ class AzureAISearch extends Tool {
    /* Used to initialize the Tool without necessary variables. */
    this.override = fields.override ?? false;

-    this.schema = azureAISearchJsonSchema;
+    // Define schema
+    this.schema = z.object({
+      query: z.string().describe('Search word or phrase to Azure AI Search'),
+    });

    // Initialize properties using helper function
    this.serviceEndpoint = this._initializeField(
--- a/api/app/clients/tools/structured/DALLE3.js
+++ b/api/app/clients/tools/structured/DALLE3.js
@ -1,3 +1,4 @@
+const { z } = require('zod');
 const path = require('path');
 const OpenAI = require('openai');
 const { v4: uuidv4 } = require('uuid');
@ -7,36 +8,6 @@ const { logger } = require('@librechat/data-schemas');
 const { getImageBasename, extractBaseURL } = require('@librechat/api');
 const { FileContext, ContentTypes } = require('librechat-data-provider');

-const dalle3JsonSchema = {
-  type: 'object',
-  properties: {
-    prompt: {
-      type: 'string',
-      maxLength: 4000,
-      description:
-        'A text description of the desired image, following the rules, up to 4000 characters.',
-    },
-    style: {
-      type: 'string',
-      enum: ['vivid', 'natural'],
-      description:
-        'Must be one of `vivid` or `natural`. `vivid` generates hyper-real and dramatic images, `natural` produces more natural, less hyper-real looking images',
-    },
-    quality: {
-      type: 'string',
-      enum: ['hd', 'standard'],
-      description: 'The quality of the generated image. Only `hd` and `standard` are supported.',
-    },
-    size: {
-      type: 'string',
-      enum: ['1024x1024', '1792x1024', '1024x1792'],
-      description:
-        'The size of the requested image. Use 1024x1024 (square) as the default, 1792x1024 if the user requests a wide image, and 1024x1792 for full-body portraits. Always include this parameter in the request.',
-    },
-  },
-  required: ['prompt', 'style', 'quality', 'size'],
-};
-
 const displayMessage =
  "DALL-E displayed an image. All generated images are already plainly visible, so don't repeat the descriptions in detail. Do not list download links as they are available in the UI already. The user may download the images by clicking on them, but do not mention anything about downloading to the user.";
 class DALLE3 extends Tool {
@ -101,11 +72,27 @@ class DALLE3 extends Tool {
    // The prompt must intricately describe every part of the image in concrete, objective detail. THINK about what the end goal of the description is, and extrapolate that to what would make satisfying images.
    // All descriptions sent to dalle should be a paragraph of text that is extremely descriptive and detailed. Each should be more than 3 sentences long.
    // - The "vivid" style is HIGHLY preferred, but "natural" is also supported.`;
-    this.schema = dalle3JsonSchema;
-  }
-
-  static get jsonSchema() {
-    return dalle3JsonSchema;
+    this.schema = z.object({
+      prompt: z
+        .string()
+        .max(4000)
+        .describe(
+          'A text description of the desired image, following the rules, up to 4000 characters.',
+        ),
+      style: z
+        .enum(['vivid', 'natural'])
+        .describe(
+          'Must be one of `vivid` or `natural`. `vivid` generates hyper-real and dramatic images, `natural` produces more natural, less hyper-real looking images',
+        ),
+      quality: z
+        .enum(['hd', 'standard'])
+        .describe('The quality of the generated image. Only `hd` and `standard` are supported.'),
+      size: z
+        .enum(['1024x1024', '1792x1024', '1024x1792'])
+        .describe(
+          'The size of the requested image. Use 1024x1024 (square) as the default, 1792x1024 if the user requests a wide image, and 1024x1792 for full-body portraits. Always include this parameter in the request.',
+        ),
+    });
  }

  getApiKey() {
--- a/api/app/clients/tools/structured/FluxAPI.js
+++ b/api/app/clients/tools/structured/FluxAPI.js
@ -1,3 +1,4 @@
+const { z } = require('zod');
 const axios = require('axios');
 const fetch = require('node-fetch');
 const { v4: uuidv4 } = require('uuid');
@ -6,84 +7,6 @@ const { logger } = require('@librechat/data-schemas');
 const { HttpsProxyAgent } = require('https-proxy-agent');
 const { FileContext, ContentTypes } = require('librechat-data-provider');

-const fluxApiJsonSchema = {
-  type: 'object',
-  properties: {
-    action: {
-      type: 'string',
-      enum: ['generate', 'list_finetunes', 'generate_finetuned'],
-      description:
-        'Action to perform: "generate" for image generation, "generate_finetuned" for finetuned model generation, "list_finetunes" to get available custom models',
-    },
-    prompt: {
-      type: 'string',
-      description:
-        'Text prompt for image generation. Required when action is "generate". Not used for list_finetunes.',
-    },
-    width: {
-      type: 'number',
-      description:
-        'Width of the generated image in pixels. Must be a multiple of 32. Default is 1024.',
-    },
-    height: {
-      type: 'number',
-      description:
-        'Height of the generated image in pixels. Must be a multiple of 32. Default is 768.',
-    },
-    prompt_upsampling: {
-      type: 'boolean',
-      description: 'Whether to perform upsampling on the prompt.',
-    },
-    steps: {
-      type: 'integer',
-      description: 'Number of steps to run the model for, a number from 1 to 50. Default is 40.',
-    },
-    seed: {
-      type: 'number',
-      description: 'Optional seed for reproducibility.',
-    },
-    safety_tolerance: {
-      type: 'number',
-      description:
-        'Tolerance level for input and output moderation. Between 0 and 6, 0 being most strict, 6 being least strict.',
-    },
-    endpoint: {
-      type: 'string',
-      enum: [
-        '/v1/flux-pro-1.1',
-        '/v1/flux-pro',
-        '/v1/flux-dev',
-        '/v1/flux-pro-1.1-ultra',
-        '/v1/flux-pro-finetuned',
-        '/v1/flux-pro-1.1-ultra-finetuned',
-      ],
-      description: 'Endpoint to use for image generation.',
-    },
-    raw: {
-      type: 'boolean',
-      description:
-        'Generate less processed, more natural-looking images. Only works for /v1/flux-pro-1.1-ultra.',
-    },
-    finetune_id: {
-      type: 'string',
-      description: 'ID of the finetuned model to use',
-    },
-    finetune_strength: {
-      type: 'number',
-      description: 'Strength of the finetuning effect (typically between 0.1 and 1.2)',
-    },
-    guidance: {
-      type: 'number',
-      description: 'Guidance scale for finetuned models',
-    },
-    aspect_ratio: {
-      type: 'string',
-      description: 'Aspect ratio for ultra models (e.g., "16:9")',
-    },
-  },
-  required: [],
-};
-
 const displayMessage =
  "Flux displayed an image. All generated images are already plainly visible, so don't repeat the descriptions in detail. Do not list download links as they are available in the UI already. The user may download the images by clicking on them, but do not mention anything about downloading to the user.";

@ -134,11 +57,82 @@ class FluxAPI extends Tool {
    // Add base URL from environment variable with fallback
    this.baseUrl = process.env.FLUX_API_BASE_URL || 'https://api.us1.bfl.ai';

-    this.schema = fluxApiJsonSchema;
-  }
-
-  static get jsonSchema() {
-    return fluxApiJsonSchema;
+    // Define the schema for structured input
+    this.schema = z.object({
+      action: z
+        .enum(['generate', 'list_finetunes', 'generate_finetuned'])
+        .default('generate')
+        .describe(
+          'Action to perform: "generate" for image generation, "generate_finetuned" for finetuned model generation, "list_finetunes" to get available custom models',
+        ),
+      prompt: z
+        .string()
+        .optional()
+        .describe(
+          'Text prompt for image generation. Required when action is "generate". Not used for list_finetunes.',
+        ),
+      width: z
+        .number()
+        .optional()
+        .describe(
+          'Width of the generated image in pixels. Must be a multiple of 32. Default is 1024.',
+        ),
+      height: z
+        .number()
+        .optional()
+        .describe(
+          'Height of the generated image in pixels. Must be a multiple of 32. Default is 768.',
+        ),
+      prompt_upsampling: z
+        .boolean()
+        .optional()
+        .default(false)
+        .describe('Whether to perform upsampling on the prompt.'),
+      steps: z
+        .number()
+        .int()
+        .optional()
+        .describe('Number of steps to run the model for, a number from 1 to 50. Default is 40.'),
+      seed: z.number().optional().describe('Optional seed for reproducibility.'),
+      safety_tolerance: z
+        .number()
+        .optional()
+        .default(6)
+        .describe(
+          'Tolerance level for input and output moderation. Between 0 and 6, 0 being most strict, 6 being least strict.',
+        ),
+      endpoint: z
+        .enum([
+          '/v1/flux-pro-1.1',
+          '/v1/flux-pro',
+          '/v1/flux-dev',
+          '/v1/flux-pro-1.1-ultra',
+          '/v1/flux-pro-finetuned',
+          '/v1/flux-pro-1.1-ultra-finetuned',
+        ])
+        .optional()
+        .default('/v1/flux-pro-1.1')
+        .describe('Endpoint to use for image generation.'),
+      raw: z
+        .boolean()
+        .optional()
+        .default(false)
+        .describe(
+          'Generate less processed, more natural-looking images. Only works for /v1/flux-pro-1.1-ultra.',
+        ),
+      finetune_id: z.string().optional().describe('ID of the finetuned model to use'),
+      finetune_strength: z
+        .number()
+        .optional()
+        .default(1.1)
+        .describe('Strength of the finetuning effect (typically between 0.1 and 1.2)'),
+      guidance: z.number().optional().default(2.5).describe('Guidance scale for finetuned models'),
+      aspect_ratio: z
+        .string()
+        .optional()
+        .default('16:9')
+        .describe('Aspect ratio for ultra models (e.g., "16:9")'),
+    });
  }

  getAxiosConfig() {
--- a/api/app/clients/tools/structured/GeminiImageGen.js
+++ b/api/app/clients/tools/structured/GeminiImageGen.js
@ -1,3 +1,4 @@
+const fs = require('fs');
 const path = require('path');
 const sharp = require('sharp');
 const { v4 } = require('uuid');
@ -5,7 +6,12 @@ const { ProxyAgent } = require('undici');
 const { GoogleGenAI } = require('@google/genai');
 const { tool } = require('@langchain/core/tools');
 const { logger } = require('@librechat/data-schemas');
-const { ContentTypes, EImageOutputType } = require('librechat-data-provider');
+const {
+  FileContext,
+  ContentTypes,
+  FileSources,
+  EImageOutputType,
+} = require('librechat-data-provider');
 const {
  geminiToolkit,
  loadServiceKey,
@ -53,12 +59,17 @@ const displayMessage =
 * @returns {string} - The processed string
 */
 function replaceUnwantedChars(inputString) {
-  return (
-    inputString
-      ?.replace(/\r\n|\r|\n/g, ' ')
-      .replace(/"/g, '')
-      .trim() || ''
-  );
+  return inputString?.replace(/[^\w\s\-_.,!?()]/g, '') || '';
+}
+
+/**
+ * Validate and sanitize image format
+ * @param {string} format - The format to validate
+ * @returns {string} - Safe format
+ */
+function getSafeFormat(format) {
+  const allowedFormats = ['png', 'jpg', 'jpeg', 'webp', 'gif'];
+  return allowedFormats.includes(format?.toLowerCase()) ? format.toLowerCase() : 'png';
 }

 /**
@ -106,8 +117,11 @@ async function initializeGeminiClient(options = {}) {
    return new GoogleGenAI({ apiKey: googleKey });
  }

+  // Fall back to Vertex AI with service account
  logger.debug('[GeminiImageGen] Using Vertex AI with service account');
  const credentialsPath = getDefaultServiceKeyPath();
+
+  // Use loadServiceKey for consistent loading (supports file paths, JSON strings, base64)
  const serviceKey = await loadServiceKey(credentialsPath);

  if (!serviceKey || !serviceKey.project_id) {
@ -117,14 +131,75 @@ async function initializeGeminiClient(options = {}) {
    );
  }

+  // Set GOOGLE_APPLICATION_CREDENTIALS for any Google Cloud SDK dependencies
+  try {
+    await fs.promises.access(credentialsPath);
+    process.env.GOOGLE_APPLICATION_CREDENTIALS = credentialsPath;
+  } catch {
+    // File doesn't exist, skip setting env var
+  }
+
  return new GoogleGenAI({
    vertexai: true,
    project: serviceKey.project_id,
    location: process.env.GOOGLE_LOC || process.env.GOOGLE_CLOUD_LOCATION || 'global',
-    googleAuthOptions: { credentials: serviceKey },
  });
 }

+/**
+ * Save image to local filesystem
+ * @param {string} base64Data - Base64 encoded image data
+ * @param {string} format - Image format
+ * @param {string} userId - User ID
+ * @returns {Promise<string>} - The relative URL
+ */
+async function saveImageLocally(base64Data, format, userId) {
+  const safeFormat = getSafeFormat(format);
+  const safeUserId = userId ? path.basename(userId) : 'default';
+  const imageName = `gemini-img-${v4()}.${safeFormat}`;
+  const userDir = path.join(process.cwd(), 'client/public/images', safeUserId);
+
+  await fs.promises.mkdir(userDir, { recursive: true });
+
+  const filePath = path.join(userDir, imageName);
+  await fs.promises.writeFile(filePath, Buffer.from(base64Data, 'base64'));
+
+  logger.debug('[GeminiImageGen] Image saved locally to:', filePath);
+  return `/images/${safeUserId}/${imageName}`;
+}
+
+/**
+ * Save image to cloud storage
+ * @param {Object} params - Parameters
+ * @returns {Promise<string|null>} - The storage URL or null
+ */
+async function saveToCloudStorage({ base64Data, format, processFileURL, fileStrategy, userId }) {
+  if (!processFileURL || !fileStrategy || !userId) {
+    return null;
+  }
+
+  try {
+    const safeFormat = getSafeFormat(format);
+    const safeUserId = path.basename(userId);
+    const dataURL = `data:image/${safeFormat};base64,${base64Data}`;
+    const imageName = `gemini-img-${v4()}.${safeFormat}`;
+
+    const result = await processFileURL({
+      URL: dataURL,
+      basePath: 'images',
+      userId: safeUserId,
+      fileName: imageName,
+      fileStrategy,
+      context: FileContext.image_generation,
+    });
+
+    return result.filepath;
+  } catch (error) {
+    logger.error('[GeminiImageGen] Error saving to cloud storage:', error);
+    return null;
+  }
+}
+
 /**
 * Convert image files to Gemini inline data format
 * @param {Object} params - Parameters
@ -251,9 +326,8 @@ function checkForSafetyBlock(response) {
 * @param {string} params.userId - The user ID
 * @param {string} params.conversationId - The conversation ID
 * @param {string} params.model - The model name
- * @param {string} [params.messageId] - The response message ID for transaction correlation
 */
-async function recordTokenUsage({ usageMetadata, req, userId, conversationId, model, messageId }) {
+async function recordTokenUsage({ usageMetadata, req, userId, conversationId, model }) {
  if (!usageMetadata) {
    logger.debug('[GeminiImageGen] No usage metadata available for balance tracking');
    return;
@ -289,7 +363,6 @@ async function recordTokenUsage({ usageMetadata, req, userId, conversationId, mo
      {
        user: userId,
        model,
-        messageId,
        conversationId,
        context: 'image_generation',
        balance,
@ -317,18 +390,34 @@ function createGeminiImageTool(fields = {}) {
    throw new Error('This tool is only available for agents.');
  }

-  const { req, imageFiles = [], userId, fileStrategy, GEMINI_API_KEY, GOOGLE_KEY } = fields;
+  // Skip validation during tool creation - validation happens at runtime in initializeGeminiClient
+  // This allows the tool to be added to agents when using Vertex AI without requiring API keys
+  // The actual credentials check happens when the tool is invoked
+
+  const {
+    req,
+    imageFiles = [],
+    processFileURL,
+    userId,
+    fileStrategy,
+    GEMINI_API_KEY,
+    GOOGLE_KEY,
+    // GEMINI_VERTEX_ENABLED is used for auth validation only (not used in code)
+    // When set as env var, it signals Vertex AI is configured and bypasses API key requirement
+  } = fields;

  const imageOutputType = fields.imageOutputType || EImageOutputType.PNG;

  const geminiImageGenTool = tool(
-    async ({ prompt, image_ids, aspectRatio, imageSize }, runnableConfig) => {
+    async ({ prompt, image_ids, aspectRatio, imageSize }, _runnableConfig) => {
      if (!prompt) {
        throw new Error('Missing required field: prompt');
      }

-      logger.debug('[GeminiImageGen] Generating image', { aspectRatio, imageSize });
+      logger.debug('[GeminiImageGen] Generating image with prompt:', prompt?.substring(0, 100));
+      logger.debug('[GeminiImageGen] Options:', { aspectRatio, imageSize });

+      // Initialize Gemini client with user-provided credentials
      let ai;
      try {
        ai = await initializeGeminiClient({
@ -343,8 +432,10 @@ function createGeminiImageTool(fields = {}) {
        ];
      }

+      // Build request contents
      const contents = [{ text: replaceUnwantedChars(prompt) }];

+      // Add context images if provided
      if (image_ids?.length > 0) {
        const contextImages = await convertImagesToInlineData({
          imageFiles,
@ -356,34 +447,28 @@ function createGeminiImageTool(fields = {}) {
        logger.debug('[GeminiImageGen] Added', contextImages.length, 'context images');
      }

+      // Generate image
      let apiResponse;
      const geminiModel = process.env.GEMINI_IMAGE_MODEL || 'gemini-2.5-flash-image';
-      const config = {
-        responseModalities: ['TEXT', 'IMAGE'],
-      };
-
-      const supportsImageSize = !geminiModel.includes('gemini-2.5-flash-image');
-      if (aspectRatio || (imageSize && supportsImageSize)) {
-        config.imageConfig = {};
-        if (aspectRatio) {
-          config.imageConfig.aspectRatio = aspectRatio;
-        }
-        if (imageSize && supportsImageSize) {
-          config.imageConfig.imageSize = imageSize;
-        }
-      }
-
-      let derivedSignal = null;
-      let abortHandler = null;
-
-      if (runnableConfig?.signal) {
-        derivedSignal = AbortSignal.any([runnableConfig.signal]);
-        abortHandler = () => logger.debug('[GeminiImageGen] Image generation aborted');
-        derivedSignal.addEventListener('abort', abortHandler, { once: true });
-        config.abortSignal = derivedSignal;
-      }
-
      try {
+        // Build config with optional imageConfig
+        const config = {
+          responseModalities: ['TEXT', 'IMAGE'],
+        };
+
+        // Add imageConfig if aspectRatio or imageSize is specified
+        // Note: gemini-2.5-flash-image doesn't support imageSize
+        const supportsImageSize = !geminiModel.includes('gemini-2.5-flash-image');
+        if (aspectRatio || (imageSize && supportsImageSize)) {
+          config.imageConfig = {};
+          if (aspectRatio) {
+            config.imageConfig.aspectRatio = aspectRatio;
+          }
+          if (imageSize && supportsImageSize) {
+            config.imageConfig.imageSize = imageSize;
+          }
+        }
+
        apiResponse = await ai.models.generateContent({
          model: geminiModel,
          contents,
@ -395,12 +480,9 @@ function createGeminiImageTool(fields = {}) {
          [{ type: ContentTypes.TEXT, text: `Image generation failed: ${error.message}` }],
          { content: [], file_ids: [] },
        ];
-      } finally {
-        if (abortHandler && derivedSignal) {
-          derivedSignal.removeEventListener('abort', abortHandler);
-        }
      }

+      // Check for safety blocks
      const safetyBlock = checkForSafetyBlock(apiResponse);
      if (safetyBlock) {
        logger.warn('[GeminiImageGen] Safety block:', safetyBlock);
@ -427,7 +509,46 @@ function createGeminiImageTool(fields = {}) {
      const imageData = convertedBuffer.toString('base64');
      const mimeType = outputFormat === 'jpeg' ? 'image/jpeg' : `image/${outputFormat}`;

+      logger.debug('[GeminiImageGen] Image format:', { outputFormat, mimeType });
+
+      let imageUrl;
+      const useLocalStorage = !fileStrategy || fileStrategy === FileSources.local;
+
+      if (useLocalStorage) {
+        try {
+          imageUrl = await saveImageLocally(imageData, outputFormat, userId);
+        } catch (error) {
+          logger.error('[GeminiImageGen] Local save failed:', error);
+          imageUrl = `data:${mimeType};base64,${imageData}`;
+        }
+      } else {
+        const cloudUrl = await saveToCloudStorage({
+          base64Data: imageData,
+          format: outputFormat,
+          processFileURL,
+          fileStrategy,
+          userId,
+        });
+
+        if (cloudUrl) {
+          imageUrl = cloudUrl;
+        } else {
+          // Fallback to local
+          try {
+            imageUrl = await saveImageLocally(imageData, outputFormat, userId);
+          } catch (_error) {
+            imageUrl = `data:${mimeType};base64,${imageData}`;
+          }
+        }
+      }
+
+      logger.debug('[GeminiImageGen] Image URL:', imageUrl);
+
+      // For the artifact, we need a data URL (same as OpenAI)
+      // The local file save is for persistence, but the response needs a data URL
      const dataUrl = `data:${mimeType};base64,${imageData}`;
+
+      // Return in content_and_artifact format (same as OpenAI)
      const file_ids = [v4()];
      const content = [
        {
@ -446,15 +567,12 @@ function createGeminiImageTool(fields = {}) {
        },
      ];

-      const conversationId = runnableConfig?.configurable?.thread_id;
-      const messageId =
-        runnableConfig?.configurable?.run_id ??
-        runnableConfig?.configurable?.requestBody?.messageId;
+      // Record token usage for balance tracking (don't await to avoid blocking response)
+      const conversationId = _runnableConfig?.configurable?.thread_id;
      recordTokenUsage({
        usageMetadata: apiResponse.usageMetadata,
        req,
        userId,
-        messageId,
        conversationId,
        model: geminiModel,
      }).catch((error) => {
--- a/api/app/clients/tools/structured/GoogleSearch.js
+++ b/api/app/clients/tools/structured/GoogleSearch.js
@ -1,33 +1,12 @@
+const { z } = require('zod');
 const { Tool } = require('@langchain/core/tools');
 const { getEnvironmentVariable } = require('@langchain/core/utils/env');

-const googleSearchJsonSchema = {
-  type: 'object',
-  properties: {
-    query: {
-      type: 'string',
-      minLength: 1,
-      description: 'The search query string.',
-    },
-    max_results: {
-      type: 'integer',
-      minimum: 1,
-      maximum: 10,
-      description: 'The maximum number of search results to return. Defaults to 5.',
-    },
-  },
-  required: ['query'],
-};
-
 class GoogleSearchResults extends Tool {
  static lc_name() {
    return 'google';
  }

-  static get jsonSchema() {
-    return googleSearchJsonSchema;
-  }
-
  constructor(fields = {}) {
    super(fields);
    this.name = 'google';
@ -49,11 +28,25 @@ class GoogleSearchResults extends Tool {
    this.description =
      'A search engine optimized for comprehensive, accurate, and trusted results. Useful for when you need to answer questions about current events.';

-    this.schema = googleSearchJsonSchema;
+    this.schema = z.object({
+      query: z.string().min(1).describe('The search query string.'),
+      max_results: z
+        .number()
+        .min(1)
+        .max(10)
+        .optional()
+        .describe('The maximum number of search results to return. Defaults to 10.'),
+      // Note: Google API has its own parameters for search customization, adjust as needed.
+    });
  }

  async _call(input) {
-    const { query, max_results = 5 } = input;
+    const validationResult = this.schema.safeParse(input);
+    if (!validationResult.success) {
+      throw new Error(`Validation failed: ${JSON.stringify(validationResult.error.issues)}`);
+    }
+
+    const { query, max_results = 5 } = validationResult.data;

    const response = await fetch(
      `https://www.googleapis.com/customsearch/v1?key=${this.apiKey}&cx=${
--- a/api/app/clients/tools/structured/OpenWeather.js
+++ b/api/app/clients/tools/structured/OpenWeather.js
@ -1,52 +1,8 @@
 const { Tool } = require('@langchain/core/tools');
+const { z } = require('zod');
 const { getEnvironmentVariable } = require('@langchain/core/utils/env');
 const fetch = require('node-fetch');

-const openWeatherJsonSchema = {
-  type: 'object',
-  properties: {
-    action: {
-      type: 'string',
-      enum: ['help', 'current_forecast', 'timestamp', 'daily_aggregation', 'overview'],
-      description: 'The action to perform',
-    },
-    city: {
-      type: 'string',
-      description: 'City name for geocoding if lat/lon not provided',
-    },
-    lat: {
-      type: 'number',
-      description: 'Latitude coordinate',
-    },
-    lon: {
-      type: 'number',
-      description: 'Longitude coordinate',
-    },
-    exclude: {
-      type: 'string',
-      description: 'Parts to exclude from the response',
-    },
-    units: {
-      type: 'string',
-      enum: ['Celsius', 'Kelvin', 'Fahrenheit'],
-      description: 'Temperature units',
-    },
-    lang: {
-      type: 'string',
-      description: 'Language code',
-    },
-    date: {
-      type: 'string',
-      description: 'Date in YYYY-MM-DD format for timestamp and daily_aggregation',
-    },
-    tz: {
-      type: 'string',
-      description: 'Timezone',
-    },
-  },
-  required: ['action'],
-};
-
 /**
 * Map user-friendly units to OpenWeather units.
 * Defaults to Celsius if not specified.
@ -110,11 +66,17 @@ class OpenWeather extends Tool {
    'Units: "Celsius", "Kelvin", or "Fahrenheit" (default: Celsius). ' +
    'For timestamp action, use "date" in YYYY-MM-DD format.';

-  schema = openWeatherJsonSchema;
-
-  static get jsonSchema() {
-    return openWeatherJsonSchema;
-  }
+  schema = z.object({
+    action: z.enum(['help', 'current_forecast', 'timestamp', 'daily_aggregation', 'overview']),
+    city: z.string().optional(),
+    lat: z.number().optional(),
+    lon: z.number().optional(),
+    exclude: z.string().optional(),
+    units: z.enum(['Celsius', 'Kelvin', 'Fahrenheit']).optional(),
+    lang: z.string().optional(),
+    date: z.string().optional(), // For timestamp and daily_aggregation
+    tz: z.string().optional(),
+  });

  constructor(fields = {}) {
    super();
--- a/api/app/clients/tools/structured/StableDiffusion.js
+++ b/api/app/clients/tools/structured/StableDiffusion.js
@ -1,5 +1,6 @@
 // Generates image using stable diffusion webui's api (automatic1111)
 const fs = require('fs');
+const { z } = require('zod');
 const path = require('path');
 const axios = require('axios');
 const sharp = require('sharp');
@ -10,23 +11,6 @@ const { FileContext, ContentTypes } = require('librechat-data-provider');
 const { getBasePath } = require('@librechat/api');
 const paths = require('~/config/paths');

-const stableDiffusionJsonSchema = {
-  type: 'object',
-  properties: {
-    prompt: {
-      type: 'string',
-      description:
-        'Detailed keywords to describe the subject, using at least 7 keywords to accurately describe the image, separated by comma',
-    },
-    negative_prompt: {
-      type: 'string',
-      description:
-        'Keywords we want to exclude from the final image, using at least 7 keywords to accurately describe the image, separated by comma',
-    },
-  },
-  required: ['prompt', 'negative_prompt'],
-};
-
 const displayMessage =
  "Stable Diffusion displayed an image. All generated images are already plainly visible, so don't repeat the descriptions in detail. Do not list download links as they are available in the UI already. The user may download the images by clicking on them, but do not mention anything about downloading to the user.";

@ -62,11 +46,18 @@ class StableDiffusionAPI extends Tool {
 // - Generate images only once per human query unless explicitly requested by the user`;
    this.description =
      "You can generate images using text with 'stable-diffusion'. This tool is exclusively for visual content.";
-    this.schema = stableDiffusionJsonSchema;
-  }
-
-  static get jsonSchema() {
-    return stableDiffusionJsonSchema;
+    this.schema = z.object({
+      prompt: z
+        .string()
+        .describe(
+          'Detailed keywords to describe the subject, using at least 7 keywords to accurately describe the image, separated by comma',
+        ),
+      negative_prompt: z
+        .string()
+        .describe(
+          'Keywords we want to exclude from the final image, using at least 7 keywords to accurately describe the image, separated by comma',
+        ),
+    });
  }

  replaceNewLinesWithSpaces(inputString) {
--- a/api/app/clients/tools/structured/TavilySearchResults.js
+++ b/api/app/clients/tools/structured/TavilySearchResults.js
@ -1,75 +1,8 @@
+const { z } = require('zod');
 const { ProxyAgent, fetch } = require('undici');
 const { Tool } = require('@langchain/core/tools');
 const { getEnvironmentVariable } = require('@langchain/core/utils/env');

-const tavilySearchJsonSchema = {
-  type: 'object',
-  properties: {
-    query: {
-      type: 'string',
-      minLength: 1,
-      description: 'The search query string.',
-    },
-    max_results: {
-      type: 'number',
-      minimum: 1,
-      maximum: 10,
-      description: 'The maximum number of search results to return. Defaults to 5.',
-    },
-    search_depth: {
-      type: 'string',
-      enum: ['basic', 'advanced'],
-      description:
-        'The depth of the search, affecting result quality and response time (`basic` or `advanced`). Default is basic for quick results and advanced for indepth high quality results but longer response time. Advanced calls equals 2 requests.',
-    },
-    include_images: {
-      type: 'boolean',
-      description:
-        'Whether to include a list of query-related images in the response. Default is False.',
-    },
-    include_answer: {
-      type: 'boolean',
-      description: 'Whether to include answers in the search results. Default is False.',
-    },
-    include_raw_content: {
-      type: 'boolean',
-      description: 'Whether to include raw content in the search results. Default is False.',
-    },
-    include_domains: {
-      type: 'array',
-      items: { type: 'string' },
-      description: 'A list of domains to specifically include in the search results.',
-    },
-    exclude_domains: {
-      type: 'array',
-      items: { type: 'string' },
-      description: 'A list of domains to specifically exclude from the search results.',
-    },
-    topic: {
-      type: 'string',
-      enum: ['general', 'news', 'finance'],
-      description:
-        'The category of the search. Use news ONLY if query SPECIFCALLY mentions the word "news".',
-    },
-    time_range: {
-      type: 'string',
-      enum: ['day', 'week', 'month', 'year', 'd', 'w', 'm', 'y'],
-      description: 'The time range back from the current date to filter results.',
-    },
-    days: {
-      type: 'number',
-      minimum: 1,
-      description: 'Number of days back from the current date to include. Only if topic is news.',
-    },
-    include_image_descriptions: {
-      type: 'boolean',
-      description:
-        'When include_images is true, also add a descriptive text for each image. Default is false.',
-    },
-  },
-  required: ['query'],
-};
-
 class TavilySearchResults extends Tool {
  static lc_name() {
    return 'TavilySearchResults';
@ -87,11 +20,64 @@ class TavilySearchResults extends Tool {
    this.description =
      'A search engine optimized for comprehensive, accurate, and trusted results. Useful for when you need to answer questions about current events.';

-    this.schema = tavilySearchJsonSchema;
-  }
-
-  static get jsonSchema() {
-    return tavilySearchJsonSchema;
+    this.schema = z.object({
+      query: z.string().min(1).describe('The search query string.'),
+      max_results: z
+        .number()
+        .min(1)
+        .max(10)
+        .optional()
+        .describe('The maximum number of search results to return. Defaults to 5.'),
+      search_depth: z
+        .enum(['basic', 'advanced'])
+        .optional()
+        .describe(
+          'The depth of the search, affecting result quality and response time (`basic` or `advanced`). Default is basic for quick results and advanced for indepth high quality results but longer response time. Advanced calls equals 2 requests.',
+        ),
+      include_images: z
+        .boolean()
+        .optional()
+        .describe(
+          'Whether to include a list of query-related images in the response. Default is False.',
+        ),
+      include_answer: z
+        .boolean()
+        .optional()
+        .describe('Whether to include answers in the search results. Default is False.'),
+      include_raw_content: z
+        .boolean()
+        .optional()
+        .describe('Whether to include raw content in the search results. Default is False.'),
+      include_domains: z
+        .array(z.string())
+        .optional()
+        .describe('A list of domains to specifically include in the search results.'),
+      exclude_domains: z
+        .array(z.string())
+        .optional()
+        .describe('A list of domains to specifically exclude from the search results.'),
+      topic: z
+        .enum(['general', 'news', 'finance'])
+        .optional()
+        .describe(
+          'The category of the search. Use news ONLY if query SPECIFCALLY mentions the word "news".',
+        ),
+      time_range: z
+        .enum(['day', 'week', 'month', 'year', 'd', 'w', 'm', 'y'])
+        .optional()
+        .describe('The time range back from the current date to filter results.'),
+      days: z
+        .number()
+        .min(1)
+        .optional()
+        .describe('Number of days back from the current date to include. Only if topic is news.'),
+      include_image_descriptions: z
+        .boolean()
+        .optional()
+        .describe(
+          'When include_images is true, also add a descriptive text for each image. Default is false.',
+        ),
+    });
  }

  getApiKey() {
@ -103,7 +89,12 @@ class TavilySearchResults extends Tool {
  }

  async _call(input) {
-    const { query, ...rest } = input;
+    const validationResult = this.schema.safeParse(input);
+    if (!validationResult.success) {
+      throw new Error(`Validation failed: ${JSON.stringify(validationResult.error.issues)}`);
+    }
+
+    const { query, ...rest } = validationResult.data;

    const requestBody = {
      api_key: this.apiKey,
--- a/api/app/clients/tools/structured/TraversaalSearch.js
+++ b/api/app/clients/tools/structured/TraversaalSearch.js
@ -1,19 +1,8 @@
+const { z } = require('zod');
 const { Tool } = require('@langchain/core/tools');
 const { logger } = require('@librechat/data-schemas');
 const { getEnvironmentVariable } = require('@langchain/core/utils/env');

-const traversaalSearchJsonSchema = {
-  type: 'object',
-  properties: {
-    query: {
-      type: 'string',
-      description:
-        "A properly written sentence to be interpreted by an AI to search the web according to the user's request.",
-    },
-  },
-  required: ['query'],
-};
-
 /**
 * Tool for the Traversaal AI search API, Ares.
 */
@ -28,15 +17,17 @@ class TraversaalSearch extends Tool {
    Useful for when you need to answer questions about current events. Input should be a search query.`;
    this.description_for_model =
      '\'Please create a specific sentence for the AI to understand and use as a query to search the web based on the user\'s request. For example, "Find information about the highest mountains in the world." or "Show me the latest news articles about climate change and its impact on polar ice caps."\'';
-    this.schema = traversaalSearchJsonSchema;
+    this.schema = z.object({
+      query: z
+        .string()
+        .describe(
+          "A properly written sentence to be interpreted by an AI to search the web according to the user's request.",
+        ),
+    });

    this.apiKey = fields?.TRAVERSAAL_API_KEY ?? this.getApiKey();
  }

-  static get jsonSchema() {
-    return traversaalSearchJsonSchema;
-  }
-
  getApiKey() {
    const apiKey = getEnvironmentVariable('TRAVERSAAL_API_KEY');
    if (!apiKey && this.override) {
--- a/api/app/clients/tools/structured/Wolfram.js
+++ b/api/app/clients/tools/structured/Wolfram.js
@ -1,19 +1,9 @@
 /* eslint-disable no-useless-escape */
+const { z } = require('zod');
 const axios = require('axios');
 const { Tool } = require('@langchain/core/tools');
 const { logger } = require('@librechat/data-schemas');

-const wolframJsonSchema = {
-  type: 'object',
-  properties: {
-    input: {
-      type: 'string',
-      description: 'Natural language query to WolframAlpha following the guidelines',
-    },
-  },
-  required: ['input'],
-};
-
 class WolframAlphaAPI extends Tool {
  constructor(fields) {
    super();
@ -51,11 +41,9 @@ class WolframAlphaAPI extends Tool {
    // -- Do not explain each step unless user input is needed. Proceed directly to making a better API call based on the available assumptions.`;
    this.description = `WolframAlpha offers computation, math, curated knowledge, and real-time data. It handles natural language queries and performs complex calculations.
    Follow the guidelines to get the best results.`;
-    this.schema = wolframJsonSchema;
-  }
-
-  static get jsonSchema() {
-    return wolframJsonSchema;
+    this.schema = z.object({
+      input: z.string().describe('Natural language query to WolframAlpha following the guidelines'),
+    });
  }

  async fetchRawText(url) {
--- a/api/app/clients/tools/structured/specs/DALLE3-proxy.spec.js
+++ b/api/app/clients/tools/structured/specs/DALLE3-proxy.spec.js
@ -1,6 +1,7 @@
 const DALLE3 = require('../DALLE3');
 const { ProxyAgent } = require('undici');

+jest.mock('tiktoken');
 const processFileURL = jest.fn();

 describe('DALLE3 Proxy Configuration', () => {
--- a/api/app/clients/tools/structured/specs/DALLE3.spec.js
+++ b/api/app/clients/tools/structured/specs/DALLE3.spec.js
@ -14,6 +14,15 @@ jest.mock('@librechat/data-schemas', () => {
  };
 });

+jest.mock('tiktoken', () => {
+  return {
+    encoding_for_model: jest.fn().mockReturnValue({
+      encode: jest.fn(),
+      decode: jest.fn(),
+    }),
+  };
+});
+
 const processFileURL = jest.fn();

 const generate = jest.fn();
--- a/api/app/clients/tools/util/fileSearch.js
+++ b/api/app/clients/tools/util/fileSearch.js
@ -1,3 +1,4 @@
+const { z } = require('zod');
 const axios = require('axios');
 const { tool } = require('@langchain/core/tools');
 const { logger } = require('@librechat/data-schemas');
@ -6,18 +7,6 @@ const { Tools, EToolResources } = require('librechat-data-provider');
 const { filterFilesByAgentAccess } = require('~/server/services/Files/permissions');
 const { getFiles } = require('~/models');

-const fileSearchJsonSchema = {
-  type: 'object',
-  properties: {
-    query: {
-      type: 'string',
-      description:
-        "A natural language query to search for relevant information in the files. Be specific and use keywords related to the information you're looking for. The query will be used for semantic similarity matching against the file contents.",
-    },
-  },
-  required: ['query'],
-};
-
 /**
 *
 * @param {Object} options
@ -193,9 +182,15 @@ Use the EXACT anchor markers shown below (copy them verbatim) immediately after
 **ALWAYS mention the filename in your text before the citation marker. NEVER use markdown links or footnotes.**`
          : ''
      }`,
-      schema: fileSearchJsonSchema,
+      schema: z.object({
+        query: z
+          .string()
+          .describe(
+            "A natural language query to search for relevant information in the files. Be specific and use keywords related to the information you're looking for. The query will be used for semantic similarity matching against the file contents.",
+          ),
+      }),
    },
  );
 };

-module.exports = { createFileSearchTool, primeFiles, fileSearchJsonSchema };
+module.exports = { createFileSearchTool, primeFiles };
--- a/api/app/clients/tools/util/handleTools.js
+++ b/api/app/clients/tools/util/handleTools.js
@ -7,12 +7,10 @@ const {
 } = require('@librechat/agents');
 const {
  checkAccess,
-  toolkitParent,
  createSafeUser,
  mcpToolPattern,
  loadWebSearchAuth,
  buildImageToolContext,
-  buildWebSearchContext,
 } = require('@librechat/api');
 const { getMCPServersRegistry } = require('~/config');
 const {
@ -21,6 +19,7 @@ const {
  Permissions,
  EToolResources,
  PermissionTypes,
+  replaceSpecialVars,
 } = require('librechat-data-provider');
 const {
  availableTools,
@ -208,7 +207,7 @@ const loadTools = async ({
    },
    gemini_image_gen: async (toolContextMap) => {
      const authFields = getAuthFields('gemini_image_gen');
-      const authValues = await loadAuthValues({ userId: user, authFields, throwError: false });
+      const authValues = await loadAuthValues({ userId: user, authFields });
      const imageFiles = options.tool_resources?.[EToolResources.image_edit]?.files ?? [];
      const toolContext = buildImageToolContext({
        imageFiles,
@ -223,6 +222,7 @@ const loadTools = async ({
        isAgent: !!agent,
        req: options.req,
        imageFiles,
+        processFileURL: options.processFileURL,
        userId: user,
        fileStrategy,
      });
@ -325,7 +325,24 @@ const loadTools = async ({
      });
      const { onSearchResults, onGetHighlights } = options?.[Tools.web_search] ?? {};
      requestedTools[tool] = async () => {
-        toolContextMap[tool] = buildWebSearchContext();
+        toolContextMap[tool] = `# \`${tool}\`:
+Current Date & Time: ${replaceSpecialVars({ text: '{{iso_datetime}}' })}
+
+**Execute immediately without preface.** After search, provide a brief summary addressing the query directly, then structure your response with clear Markdown formatting (## headers, lists, tables). Cite sources properly, tailor tone to query type, and provide comprehensive details.
+
+**CITATION FORMAT - UNICODE ESCAPE SEQUENCES ONLY:**
+Use these EXACT escape sequences (copy verbatim): \\ue202 (before each anchor), \\ue200 (group start), \\ue201 (group end), \\ue203 (highlight start), \\ue204 (highlight end)
+
+Anchor pattern: \\ue202turn{N}{type}{index} where N=turn number, type=search|news|image|ref, index=0,1,2...
+
+**Examples (copy these exactly):**
+- Single: "Statement.\\ue202turn0search0"
+- Multiple: "Statement.\\ue202turn0search0\\ue202turn0news1"
+- Group: "Statement. \\ue200\\ue202turn0search0\\ue202turn0news1\\ue201"
+- Highlight: "\\ue203Cited text.\\ue204\\ue202turn0search0"
+- Image: "See photo\\ue202turn0image0."
+
+**CRITICAL:** Output escape sequences EXACTLY as shown. Do NOT substitute with † or other symbols. Place anchors AFTER punctuation. Cite every non-obvious fact/quote. NEVER use markdown links, [1], footnotes, or HTML tags.`.trim();
        return createSearchTool({
          ...result.authResult,
          onSearchResults,
@ -370,16 +387,8 @@ const loadTools = async ({
      continue;
    }

-    const toolKey = customConstructors[tool] ? tool : toolkitParent[tool];
-    if (toolKey && customConstructors[toolKey]) {
-      if (!requestedTools[toolKey]) {
-        let cached;
-        requestedTools[toolKey] = async () => {
-          cached ??= customConstructors[toolKey](toolContextMap);
-          return cached;
-        };
-      }
-      requestedTools[tool] = requestedTools[toolKey];
+    if (customConstructors[tool]) {
+      requestedTools[tool] = async () => customConstructors[tool](toolContextMap);
      continue;
    }

--- a/api/cache/banViolation.js
+++ b/api/cache/banViolation.js
@ -55,7 +55,6 @@ const banViolation = async (req, res, errorMessage) => {

  res.clearCookie('refreshToken');
  res.clearCookie('openid_access_token');
-  res.clearCookie('openid_id_token');
  res.clearCookie('openid_user_id');
  res.clearCookie('token_provider');

--- a/api/cache/getLogStores.js
+++ b/api/cache/getLogStores.js
@ -37,7 +37,6 @@ const namespaces = {
  [CacheKeys.ROLES]: standardCache(CacheKeys.ROLES),
  [CacheKeys.APP_CONFIG]: standardCache(CacheKeys.APP_CONFIG),
  [CacheKeys.CONFIG_STORE]: standardCache(CacheKeys.CONFIG_STORE),
-  [CacheKeys.TOOL_CACHE]: standardCache(CacheKeys.TOOL_CACHE),
  [CacheKeys.PENDING_REQ]: standardCache(CacheKeys.PENDING_REQ),
  [CacheKeys.ENCODED_DOMAINS]: new Keyv({ store: keyvMongo, namespace: CacheKeys.ENCODED_DOMAINS }),
  [CacheKeys.ABORT_KEYS]: standardCache(CacheKeys.ABORT_KEYS, Time.TEN_MINUTES),
@ -47,15 +46,11 @@ const namespaces = {
  [CacheKeys.MODEL_QUERIES]: standardCache(CacheKeys.MODEL_QUERIES),
  [CacheKeys.AUDIO_RUNS]: standardCache(CacheKeys.AUDIO_RUNS, Time.TEN_MINUTES),
  [CacheKeys.MESSAGES]: standardCache(CacheKeys.MESSAGES, Time.ONE_MINUTE),
-  [CacheKeys.FLOWS]: standardCache(CacheKeys.FLOWS, Time.ONE_MINUTE * 10),
+  [CacheKeys.FLOWS]: standardCache(CacheKeys.FLOWS, Time.ONE_MINUTE * 3),
  [CacheKeys.OPENID_EXCHANGED_TOKENS]: standardCache(
    CacheKeys.OPENID_EXCHANGED_TOKENS,
    Time.TEN_MINUTES,
  ),
-  [CacheKeys.ADMIN_OAUTH_EXCHANGE]: standardCache(
-    CacheKeys.ADMIN_OAUTH_EXCHANGE,
-    Time.THIRTY_SECONDS,
-  ),
 };

 /**
--- a/api/db/connect.js
+++ b/api/db/connect.js
@ -40,10 +40,6 @@ if (!cached) {
  cached = global.mongoose = { conn: null, promise: null };
 }

-mongoose.connection.on('error', (err) => {
-  logger.error('[connectDb] MongoDB connection error:', err);
-});
-
 async function connectDb() {
  if (cached.conn && cached.conn?._readyState === 1) {
    return cached.conn;
--- a/api/db/indexSync.js
+++ b/api/db/indexSync.js
@ -236,12 +236,8 @@ async function performSync(flowManager, flowId, flowType) {
      const messageCount = messageProgress.totalDocuments;
      const messagesIndexed = messageProgress.totalProcessed;
      const unindexedMessages = messageCount - messagesIndexed;
-      const noneIndexed = messagesIndexed === 0 && unindexedMessages > 0;

-      if (settingsUpdated || noneIndexed || unindexedMessages > syncThreshold) {
-        if (noneIndexed && !settingsUpdated) {
-          logger.info('[indexSync] No messages marked as indexed, forcing full sync');
-        }
+      if (settingsUpdated || unindexedMessages > syncThreshold) {
        logger.info(`[indexSync] Starting message sync (${unindexedMessages} unindexed)`);
        await Message.syncWithMeili();
        messagesSync = true;
@ -265,13 +261,9 @@ async function performSync(flowManager, flowId, flowType) {

      const convoCount = convoProgress.totalDocuments;
      const convosIndexed = convoProgress.totalProcessed;
-      const unindexedConvos = convoCount - convosIndexed;
-      const noneConvosIndexed = convosIndexed === 0 && unindexedConvos > 0;

-      if (settingsUpdated || noneConvosIndexed || unindexedConvos > syncThreshold) {
-        if (noneConvosIndexed && !settingsUpdated) {
-          logger.info('[indexSync] No conversations marked as indexed, forcing full sync');
-        }
+      const unindexedConvos = convoCount - convosIndexed;
+      if (settingsUpdated || unindexedConvos > syncThreshold) {
        logger.info(`[indexSync] Starting convos sync (${unindexedConvos} unindexed)`);
        await Conversation.syncWithMeili();
        convosSync = true;
--- a/api/db/indexSync.spec.js
+++ b/api/db/indexSync.spec.js
@ -462,69 +462,4 @@ describe('performSync() - syncThreshold logic', () => {
    );
    expect(mockLogger.info).toHaveBeenCalledWith('[indexSync] Starting convos sync (50 unindexed)');
  });
-
-  test('forces sync when zero documents indexed (reset scenario) even if below threshold', async () => {
-    Message.getSyncProgress.mockResolvedValue({
-      totalProcessed: 0,
-      totalDocuments: 680,
-      isComplete: false,
-    });
-
-    Conversation.getSyncProgress.mockResolvedValue({
-      totalProcessed: 0,
-      totalDocuments: 76,
-      isComplete: false,
-    });
-
-    Message.syncWithMeili.mockResolvedValue(undefined);
-    Conversation.syncWithMeili.mockResolvedValue(undefined);
-
-    const indexSync = require('./indexSync');
-    await indexSync();
-
-    expect(Message.syncWithMeili).toHaveBeenCalledTimes(1);
-    expect(Conversation.syncWithMeili).toHaveBeenCalledTimes(1);
-    expect(mockLogger.info).toHaveBeenCalledWith(
-      '[indexSync] No messages marked as indexed, forcing full sync',
-    );
-    expect(mockLogger.info).toHaveBeenCalledWith(
-      '[indexSync] Starting message sync (680 unindexed)',
-    );
-    expect(mockLogger.info).toHaveBeenCalledWith(
-      '[indexSync] No conversations marked as indexed, forcing full sync',
-    );
-    expect(mockLogger.info).toHaveBeenCalledWith('[indexSync] Starting convos sync (76 unindexed)');
-  });
-
-  test('does NOT force sync when some documents already indexed and below threshold', async () => {
-    Message.getSyncProgress.mockResolvedValue({
-      totalProcessed: 630,
-      totalDocuments: 680,
-      isComplete: false,
-    });
-
-    Conversation.getSyncProgress.mockResolvedValue({
-      totalProcessed: 70,
-      totalDocuments: 76,
-      isComplete: false,
-    });
-
-    const indexSync = require('./indexSync');
-    await indexSync();
-
-    expect(Message.syncWithMeili).not.toHaveBeenCalled();
-    expect(Conversation.syncWithMeili).not.toHaveBeenCalled();
-    expect(mockLogger.info).not.toHaveBeenCalledWith(
-      '[indexSync] No messages marked as indexed, forcing full sync',
-    );
-    expect(mockLogger.info).not.toHaveBeenCalledWith(
-      '[indexSync] No conversations marked as indexed, forcing full sync',
-    );
-    expect(mockLogger.info).toHaveBeenCalledWith(
-      '[indexSync] 50 messages unindexed (below threshold: 1000, skipping)',
-    );
-    expect(mockLogger.info).toHaveBeenCalledWith(
-      '[indexSync] 6 convos unindexed (below threshold: 1000, skipping)',
-    );
-  });
 });
--- a/api/db/utils.js
+++ b/api/db/utils.js
@ -26,7 +26,7 @@ async function batchResetMeiliFlags(collection) {
  try {
    while (hasMore) {
      const docs = await collection
-        .find({ expiredAt: null, _meiliIndex: { $ne: false } }, { projection: { _id: 1 } })
+        .find({ expiredAt: null, _meiliIndex: true }, { projection: { _id: 1 } })
        .limit(BATCH_SIZE)
        .toArray();

--- a/api/db/utils.spec.js
+++ b/api/db/utils.spec.js
@ -265,8 +265,8 @@ describe('batchResetMeiliFlags', () => {

      const result = await batchResetMeiliFlags(testCollection);

-      // both documents should be updated
-      expect(result).toBe(2);
+      // Only one document has _meiliIndex: true
+      expect(result).toBe(1);
    });

    it('should handle mixed document states correctly', async () => {
@ -275,18 +275,16 @@ describe('batchResetMeiliFlags', () => {
        { _id: new mongoose.Types.ObjectId(), expiredAt: null, _meiliIndex: false },
        { _id: new mongoose.Types.ObjectId(), expiredAt: new Date(), _meiliIndex: true },
        { _id: new mongoose.Types.ObjectId(), expiredAt: null, _meiliIndex: true },
-        { _id: new mongoose.Types.ObjectId(), expiredAt: null, _meiliIndex: null },
-        { _id: new mongoose.Types.ObjectId(), expiredAt: null },
      ]);

      const result = await batchResetMeiliFlags(testCollection);

-      expect(result).toBe(4);
+      expect(result).toBe(2);

      const flaggedDocs = await testCollection
        .find({ expiredAt: null, _meiliIndex: false })
        .toArray();
-      expect(flaggedDocs).toHaveLength(5); // 4 were updated, 1 was already false
+      expect(flaggedDocs).toHaveLength(3); // 2 were updated, 1 was already false
    });
  });

--- a/api/jest.config.js
+++ b/api/jest.config.js
@ -3,13 +3,12 @@ module.exports = {
  clearMocks: true,
  roots: ['<rootDir>'],
  coverageDirectory: 'coverage',
-  maxWorkers: '50%',
  testTimeout: 30000, // 30 seconds timeout for all tests
  setupFiles: ['./test/jestSetup.js', './test/__mocks__/logger.js'],
  moduleNameMapper: {
    '~/(.*)': '<rootDir>/$1',
    '~/data/auth.json': '<rootDir>/__mocks__/auth.mock.json',
-    '^openid-client/passport$': '<rootDir>/test/__mocks__/openid-client-passport.js',
+    '^openid-client/passport$': '<rootDir>/test/__mocks__/openid-client-passport.js', // Mock for the passport strategy part
    '^openid-client$': '<rootDir>/test/__mocks__/openid-client.js',
  },
  transformIgnorePatterns: ['/node_modules/(?!(openid-client|oauth4webapi|jose)/).*/'],
--- a/api/models/Action.js
+++ b/api/models/Action.js
@ -4,7 +4,9 @@ const { Action } = require('~/db/models');
 * Update an action with new data without overwriting existing properties,
 * or create a new action if it doesn't exist.
 *
- * @param {{ action_id: string, agent_id?: string, assistant_id?: string, user?: string }} searchParams
+ * @param {Object} searchParams - The search parameters to find the action to update.
+ * @param {string} searchParams.action_id - The ID of the action to update.
+ * @param {string} searchParams.user - The user ID of the action's author.
 * @param {Object} updateData - An object containing the properties to update.
 * @returns {Promise<Action>} The updated or newly created action document as a plain object.
 */
@ -45,8 +47,10 @@ const getActions = async (searchParams, includeSensitive = false) => {
 /**
 * Deletes an action by params.
 *
- * @param {{ action_id: string, agent_id?: string, assistant_id?: string, user?: string }} searchParams
- * @returns {Promise<Action|null>} The deleted action document as a plain object, or null if no match.
+ * @param {Object} searchParams - The search parameters to find the action to delete.
+ * @param {string} searchParams.action_id - The ID of the action to delete.
+ * @param {string} searchParams.user - The user ID of the action's author.
+ * @returns {Promise<Action>} A promise that resolves to the deleted action document as a plain object, or null if no document was found.
 */
 const deleteAction = async (searchParams) => {
  return await Action.findOneAndDelete(searchParams).lean();
--- a/api/models/Action.spec.js
+++ b/api/models/Action.spec.js
@ -1,250 +0,0 @@
-const mongoose = require('mongoose');
-const { MongoMemoryServer } = require('mongodb-memory-server');
-const { actionSchema } = require('@librechat/data-schemas');
-const { updateAction, getActions, deleteAction } = require('./Action');
-
-let mongoServer;
-
-beforeAll(async () => {
-  mongoServer = await MongoMemoryServer.create();
-  const mongoUri = mongoServer.getUri();
-  if (!mongoose.models.Action) {
-    mongoose.model('Action', actionSchema);
-  }
-  await mongoose.connect(mongoUri);
-}, 20000);
-
-afterAll(async () => {
-  await mongoose.disconnect();
-  await mongoServer.stop();
-});
-
-beforeEach(async () => {
-  await mongoose.models.Action.deleteMany({});
-});
-
-const userId = new mongoose.Types.ObjectId();
-
-describe('Action ownership scoping', () => {
-  describe('updateAction', () => {
-    it('updates when action_id and agent_id both match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_1',
-        agent_id: 'agent_A',
-        metadata: { domain: 'example.com' },
-      });
-
-      const result = await updateAction(
-        { action_id: 'act_1', agent_id: 'agent_A' },
-        { metadata: { domain: 'updated.com' } },
-      );
-
-      expect(result).not.toBeNull();
-      expect(result.metadata.domain).toBe('updated.com');
-      expect(result.agent_id).toBe('agent_A');
-    });
-
-    it('does not update when agent_id does not match (creates a new doc via upsert)', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_1',
-        agent_id: 'agent_B',
-        metadata: { domain: 'victim.com', api_key: 'secret' },
-      });
-
-      const result = await updateAction(
-        { action_id: 'act_1', agent_id: 'agent_A' },
-        { user: userId, metadata: { domain: 'attacker.com' } },
-      );
-
-      expect(result.metadata.domain).toBe('attacker.com');
-
-      const original = await mongoose.models.Action.findOne({
-        action_id: 'act_1',
-        agent_id: 'agent_B',
-      }).lean();
-      expect(original).not.toBeNull();
-      expect(original.metadata.domain).toBe('victim.com');
-      expect(original.metadata.api_key).toBe('secret');
-    });
-
-    it('updates when action_id and assistant_id both match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_2',
-        assistant_id: 'asst_X',
-        metadata: { domain: 'example.com' },
-      });
-
-      const result = await updateAction(
-        { action_id: 'act_2', assistant_id: 'asst_X' },
-        { metadata: { domain: 'updated.com' } },
-      );
-
-      expect(result).not.toBeNull();
-      expect(result.metadata.domain).toBe('updated.com');
-    });
-
-    it('does not overwrite when assistant_id does not match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_2',
-        assistant_id: 'asst_victim',
-        metadata: { domain: 'victim.com', api_key: 'secret' },
-      });
-
-      await updateAction(
-        { action_id: 'act_2', assistant_id: 'asst_attacker' },
-        { user: userId, metadata: { domain: 'attacker.com' } },
-      );
-
-      const original = await mongoose.models.Action.findOne({
-        action_id: 'act_2',
-        assistant_id: 'asst_victim',
-      }).lean();
-      expect(original).not.toBeNull();
-      expect(original.metadata.domain).toBe('victim.com');
-      expect(original.metadata.api_key).toBe('secret');
-    });
-  });
-
-  describe('deleteAction', () => {
-    it('deletes when action_id and agent_id both match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_del',
-        agent_id: 'agent_A',
-        metadata: { domain: 'example.com' },
-      });
-
-      const result = await deleteAction({ action_id: 'act_del', agent_id: 'agent_A' });
-      expect(result).not.toBeNull();
-      expect(result.action_id).toBe('act_del');
-
-      const remaining = await mongoose.models.Action.countDocuments();
-      expect(remaining).toBe(0);
-    });
-
-    it('returns null and preserves the document when agent_id does not match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_del',
-        agent_id: 'agent_B',
-        metadata: { domain: 'victim.com' },
-      });
-
-      const result = await deleteAction({ action_id: 'act_del', agent_id: 'agent_A' });
-      expect(result).toBeNull();
-
-      const remaining = await mongoose.models.Action.countDocuments();
-      expect(remaining).toBe(1);
-    });
-
-    it('deletes when action_id and assistant_id both match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_del_asst',
-        assistant_id: 'asst_X',
-        metadata: { domain: 'example.com' },
-      });
-
-      const result = await deleteAction({ action_id: 'act_del_asst', assistant_id: 'asst_X' });
-      expect(result).not.toBeNull();
-
-      const remaining = await mongoose.models.Action.countDocuments();
-      expect(remaining).toBe(0);
-    });
-
-    it('returns null and preserves the document when assistant_id does not match', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_del_asst',
-        assistant_id: 'asst_victim',
-        metadata: { domain: 'victim.com' },
-      });
-
-      const result = await deleteAction({
-        action_id: 'act_del_asst',
-        assistant_id: 'asst_attacker',
-      });
-      expect(result).toBeNull();
-
-      const remaining = await mongoose.models.Action.countDocuments();
-      expect(remaining).toBe(1);
-    });
-  });
-
-  describe('getActions (unscoped baseline)', () => {
-    it('returns actions by action_id regardless of agent_id', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_shared',
-        agent_id: 'agent_B',
-        metadata: { domain: 'example.com' },
-      });
-
-      const results = await getActions({ action_id: 'act_shared' }, true);
-      expect(results).toHaveLength(1);
-      expect(results[0].agent_id).toBe('agent_B');
-    });
-
-    it('returns actions scoped by agent_id when provided', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_scoped',
-        agent_id: 'agent_A',
-        metadata: { domain: 'a.com' },
-      });
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_other',
-        agent_id: 'agent_B',
-        metadata: { domain: 'b.com' },
-      });
-
-      const results = await getActions({ agent_id: 'agent_A' });
-      expect(results).toHaveLength(1);
-      expect(results[0].action_id).toBe('act_scoped');
-    });
-  });
-
-  describe('cross-type protection', () => {
-    it('updateAction with agent_id filter does not overwrite assistant-owned action', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_cross',
-        assistant_id: 'asst_victim',
-        metadata: { domain: 'victim.com', api_key: 'secret' },
-      });
-
-      await updateAction(
-        { action_id: 'act_cross', agent_id: 'agent_attacker' },
-        { user: userId, metadata: { domain: 'evil.com' } },
-      );
-
-      const original = await mongoose.models.Action.findOne({
-        action_id: 'act_cross',
-        assistant_id: 'asst_victim',
-      }).lean();
-      expect(original).not.toBeNull();
-      expect(original.metadata.domain).toBe('victim.com');
-      expect(original.metadata.api_key).toBe('secret');
-    });
-
-    it('deleteAction with agent_id filter does not delete assistant-owned action', async () => {
-      await mongoose.models.Action.create({
-        user: userId,
-        action_id: 'act_cross_del',
-        assistant_id: 'asst_victim',
-        metadata: { domain: 'victim.com' },
-      });
-
-      const result = await deleteAction({ action_id: 'act_cross_del', agent_id: 'agent_attacker' });
-      expect(result).toBeNull();
-
-      const remaining = await mongoose.models.Action.countDocuments();
-      expect(remaining).toBe(1);
-    });
-  });
-});
--- a/api/models/Agent.js
+++ b/api/models/Agent.js
@ -589,16 +589,10 @@ const deleteAgent = async (searchParameter) => {
  const agent = await Agent.findOneAndDelete(searchParameter);
  if (agent) {
    await removeAgentFromAllProjects(agent.id);
-    await Promise.all([
-      removeAllPermissions({
-        resourceType: ResourceType.AGENT,
-        resourceId: agent._id,
-      }),
-      removeAllPermissions({
-        resourceType: ResourceType.REMOTE_AGENT,
-        resourceId: agent._id,
-      }),
-    ]);
+    await removeAllPermissions({
+      resourceType: ResourceType.AGENT,
+      resourceId: agent._id,
+    });
    try {
      await Agent.updateMany({ 'edges.to': agent.id }, { $pull: { edges: { to: agent.id } } });
    } catch (error) {
@ -637,7 +631,7 @@ const deleteUserAgents = async (userId) => {
    }

    await AclEntry.deleteMany({
-      resourceType: { $in: [ResourceType.AGENT, ResourceType.REMOTE_AGENT] },
+      resourceType: ResourceType.AGENT,
      resourceId: { $in: agentObjectIds },
    });

--- a/api/models/Conversation.js
+++ b/api/models/Conversation.js
@ -124,15 +124,10 @@ module.exports = {
        updateOperation,
        {
          new: true,
-          upsert: metadata?.noUpsert !== true,
+          upsert: true,
        },
      );

-      if (!conversation) {
-        logger.debug('[saveConvo] Conversation not found, skipping update');
-        return null;
-      }
-
      return conversation.toObject();
    } catch (error) {
      logger.error('[saveConvo] Error saving conversation', error);
@ -228,7 +223,7 @@ module.exports = {
            },
          ],
        };
-      } catch (_err) {
+      } catch (err) {
        logger.warn('[getConvosByCursor] Invalid cursor format, starting from beginning');
      }
      if (cursorFilter) {
@ -361,7 +356,6 @@ module.exports = {

      const deleteMessagesResult = await deleteMessages({
        conversationId: { $in: conversationIds },
-        user,
      });

      return { ...deleteConvoResult, messages: deleteMessagesResult };
--- a/api/models/Conversation.spec.js
+++ b/api/models/Conversation.spec.js
@ -106,47 +106,6 @@ describe('Conversation Operations', () => {
      expect(result.conversationId).toBe(newConversationId);
    });

-    it('should not create a conversation when noUpsert is true and conversation does not exist', async () => {
-      const nonExistentId = uuidv4();
-      const result = await saveConvo(
-        mockReq,
-        { conversationId: nonExistentId, title: 'Ghost Title' },
-        { noUpsert: true },
-      );
-
-      expect(result).toBeNull();
-
-      const dbConvo = await Conversation.findOne({ conversationId: nonExistentId });
-      expect(dbConvo).toBeNull();
-    });
-
-    it('should update an existing conversation when noUpsert is true', async () => {
-      await saveConvo(mockReq, mockConversationData);
-
-      const result = await saveConvo(
-        mockReq,
-        { conversationId: mockConversationData.conversationId, title: 'Updated Title' },
-        { noUpsert: true },
-      );
-
-      expect(result).not.toBeNull();
-      expect(result.title).toBe('Updated Title');
-      expect(result.conversationId).toBe(mockConversationData.conversationId);
-    });
-
-    it('should still upsert by default when noUpsert is not provided', async () => {
-      const newId = uuidv4();
-      const result = await saveConvo(mockReq, {
-        conversationId: newId,
-        title: 'New Conversation',
-        endpoint: EModelEndpoint.openAI,
-      });
-
-      expect(result).not.toBeNull();
-      expect(result.conversationId).toBe(newId);
-      expect(result.title).toBe('New Conversation');
-    });
-
    it('should handle unsetFields metadata', async () => {
      const metadata = {
        unsetFields: { someField: 1 },
@ -163,6 +122,7 @@ describe('Conversation Operations', () => {

  describe('isTemporary conversation handling', () => {
    it('should save a conversation with expiredAt when isTemporary is true', async () => {
+      // Mock app config with 24 hour retention
      mockReq.config.interfaceConfig.temporaryChatRetention = 24;

      mockReq.body = { isTemporary: true };
@ -175,6 +135,7 @@ describe('Conversation Operations', () => {
      expect(result.expiredAt).toBeDefined();
      expect(result.expiredAt).toBeInstanceOf(Date);

+      // Verify expiredAt is approximately 24 hours in the future
      const expectedExpirationTime = new Date(beforeSave.getTime() + 24 * 60 * 60 * 1000);
      const actualExpirationTime = new Date(result.expiredAt);

@ -196,6 +157,7 @@ describe('Conversation Operations', () => {
    });

    it('should save a conversation without expiredAt when isTemporary is not provided', async () => {
+      // No isTemporary in body
      mockReq.body = {};

      const result = await saveConvo(mockReq, mockConversationData);
@ -205,6 +167,7 @@ describe('Conversation Operations', () => {
    });

    it('should use custom retention period from config', async () => {
+      // Mock app config with 48 hour retention
      mockReq.config.interfaceConfig.temporaryChatRetention = 48;

      mockReq.body = { isTemporary: true };
@ -549,7 +512,6 @@ describe('Conversation Operations', () => {
      expect(result.messages.deletedCount).toBe(5);
      expect(deleteMessages).toHaveBeenCalledWith({
        conversationId: { $in: [mockConversationData.conversationId] },
-        user: 'user123',
      });

      // Verify conversation was deleted
--- a/api/models/File.js
+++ b/api/models/File.js
@ -26,8 +26,7 @@ const getFiles = async (filter, _sortOptions, selectFields = { text: 0 }) => {
 };

 /**
- * Retrieves tool files (files that are embedded or have a fileIdentifier) from an array of file IDs.
- * Note: execute_code files are handled separately by getCodeGeneratedFiles.
+ * Retrieves tool files (files that are embedded or have a fileIdentifier) from an array of file IDs
 * @param {string[]} fileIds - Array of file_id strings to search for
 * @param {Set<EToolResources>} toolResourceSet - Optional filter for tool resources
 * @returns {Promise<Array<MongoFile>>} Files that match the criteria
@ -38,25 +37,21 @@ const getToolFilesByIds = async (fileIds, toolResourceSet) => {
  }

  try {
-    const orConditions = [];
-
-    if (toolResourceSet.has(EToolResources.context)) {
-      orConditions.push({ text: { $exists: true, $ne: null }, context: FileContext.agents });
-    }
-    if (toolResourceSet.has(EToolResources.file_search)) {
-      orConditions.push({ embedded: true });
-    }
-
-    if (orConditions.length === 0) {
-      return [];
-    }
-
    const filter = {
      file_id: { $in: fileIds },
-      context: { $ne: FileContext.execute_code }, // Exclude code-generated files
-      $or: orConditions,
+      $or: [],
    };

+    if (toolResourceSet.has(EToolResources.context)) {
+      filter.$or.push({ text: { $exists: true, $ne: null }, context: FileContext.agents });
+    }
+    if (toolResourceSet.has(EToolResources.file_search)) {
+      filter.$or.push({ embedded: true });
+    }
+    if (toolResourceSet.has(EToolResources.execute_code)) {
+      filter.$or.push({ 'metadata.fileIdentifier': { $exists: true } });
+    }
+
    const selectFields = { text: 0 };
    const sortOptions = { updatedAt: -1 };

@ -67,70 +62,6 @@ const getToolFilesByIds = async (fileIds, toolResourceSet) => {
  }
 };

-/**
- * Retrieves files generated by code execution for a given conversation.
- * These files are stored locally with fileIdentifier metadata for code env re-upload.
- * @param {string} conversationId - The conversation ID to search for
- * @param {string[]} [messageIds] - Optional array of messageIds to filter by (for linear thread filtering)
- * @returns {Promise<Array<MongoFile>>} Files generated by code execution in the conversation
- */
-const getCodeGeneratedFiles = async (conversationId, messageIds) => {
-  if (!conversationId) {
-    return [];
-  }
-
-  /** messageIds are required for proper thread filtering of code-generated files */
-  if (!messageIds || messageIds.length === 0) {
-    return [];
-  }
-
-  try {
-    const filter = {
-      conversationId,
-      context: FileContext.execute_code,
-      messageId: { $exists: true, $in: messageIds },
-      'metadata.fileIdentifier': { $exists: true },
-    };
-
-    const selectFields = { text: 0 };
-    const sortOptions = { createdAt: 1 };
-
-    return await getFiles(filter, sortOptions, selectFields);
-  } catch (error) {
-    logger.error('[getCodeGeneratedFiles] Error retrieving code generated files:', error);
-    return [];
-  }
-};
-
-/**
- * Retrieves user-uploaded execute_code files (not code-generated) by their file IDs.
- * These are files with fileIdentifier metadata but context is NOT execute_code (e.g., agents or message_attachment).
- * File IDs should be collected from message.files arrays in the current thread.
- * @param {string[]} fileIds - Array of file IDs to fetch (from message.files in the thread)
- * @returns {Promise<Array<MongoFile>>} User-uploaded execute_code files
- */
-const getUserCodeFiles = async (fileIds) => {
-  if (!fileIds || fileIds.length === 0) {
-    return [];
-  }
-
-  try {
-    const filter = {
-      file_id: { $in: fileIds },
-      context: { $ne: FileContext.execute_code },
-      'metadata.fileIdentifier': { $exists: true },
-    };
-
-    const selectFields = { text: 0 };
-    const sortOptions = { createdAt: 1 };
-
-    return await getFiles(filter, sortOptions, selectFields);
-  } catch (error) {
-    logger.error('[getUserCodeFiles] Error retrieving user code files:', error);
-    return [];
-  }
-};
-
 /**
 * Creates a new file with a TTL of 1 hour.
 * @param {MongoFile} data - The file data to be created, must contain file_id.
@ -238,8 +169,6 @@ module.exports = {
  findFileById,
  getFiles,
  getToolFilesByIds,
-  getCodeGeneratedFiles,
-  getUserCodeFiles,
  createFile,
  updateFile,
  updateFileUsage,
--- a/api/models/File.spec.js
+++ b/api/models/File.spec.js
@ -152,11 +152,12 @@ describe('File Access Control', () => {
      expect(accessMap.get(fileIds[3])).toBe(false);
    });

-    it('should only grant author access to files attached to the agent', async () => {
+    it('should grant access to all files when user is the agent author', async () => {
      const authorId = new mongoose.Types.ObjectId();
      const agentId = uuidv4();
      const fileIds = [uuidv4(), uuidv4(), uuidv4()];

+      // Create author user
      await User.create({
        _id: authorId,
        email: 'author@example.com',
@ -164,6 +165,7 @@ describe('File Access Control', () => {
        provider: 'local',
      });

+      // Create agent
      await createAgent({
        id: agentId,
        name: 'Test Agent',
@ -172,83 +174,12 @@ describe('File Access Control', () => {
        provider: 'openai',
        tool_resources: {
          file_search: {
-            file_ids: [fileIds[0]],
-          },
-        },
-      });
-
-      const { hasAccessToFilesViaAgent } = require('~/server/services/Files/permissions');
-      const accessMap = await hasAccessToFilesViaAgent({
-        userId: authorId,
-        role: SystemRoles.USER,
-        fileIds,
-        agentId,
-      });
-
-      expect(accessMap.get(fileIds[0])).toBe(true);
-      expect(accessMap.get(fileIds[1])).toBe(false);
-      expect(accessMap.get(fileIds[2])).toBe(false);
-    });
-
-    it('should deny all access when agent has no tool_resources', async () => {
-      const authorId = new mongoose.Types.ObjectId();
-      const agentId = uuidv4();
-      const fileId = uuidv4();
-
-      await User.create({
-        _id: authorId,
-        email: 'author-no-resources@example.com',
-        emailVerified: true,
-        provider: 'local',
-      });
-
-      await createAgent({
-        id: agentId,
-        name: 'Bare Agent',
-        author: authorId,
-        model: 'gpt-4',
-        provider: 'openai',
-      });
-
-      const { hasAccessToFilesViaAgent } = require('~/server/services/Files/permissions');
-      const accessMap = await hasAccessToFilesViaAgent({
-        userId: authorId,
-        role: SystemRoles.USER,
-        fileIds: [fileId],
-        agentId,
-      });
-
-      expect(accessMap.get(fileId)).toBe(false);
-    });
-
-    it('should grant access to files across multiple resource types', async () => {
-      const authorId = new mongoose.Types.ObjectId();
-      const agentId = uuidv4();
-      const fileIds = [uuidv4(), uuidv4(), uuidv4()];
-
-      await User.create({
-        _id: authorId,
-        email: 'author-multi@example.com',
-        emailVerified: true,
-        provider: 'local',
-      });
-
-      await createAgent({
-        id: agentId,
-        name: 'Multi Resource Agent',
-        author: authorId,
-        model: 'gpt-4',
-        provider: 'openai',
-        tool_resources: {
-          file_search: {
-            file_ids: [fileIds[0]],
-          },
-          execute_code: {
-            file_ids: [fileIds[1]],
+            file_ids: [fileIds[0]], // Only one file attached
          },
        },
      });

+      // Check access as the author
      const { hasAccessToFilesViaAgent } = require('~/server/services/Files/permissions');
      const accessMap = await hasAccessToFilesViaAgent({
        userId: authorId,
@ -257,48 +188,10 @@ describe('File Access Control', () => {
        agentId,
      });

+      // Author should have access to all files
      expect(accessMap.get(fileIds[0])).toBe(true);
      expect(accessMap.get(fileIds[1])).toBe(true);
-      expect(accessMap.get(fileIds[2])).toBe(false);
-    });
-
-    it('should grant author access to attached files when isDelete is true', async () => {
-      const authorId = new mongoose.Types.ObjectId();
-      const agentId = uuidv4();
-      const attachedFileId = uuidv4();
-      const unattachedFileId = uuidv4();
-
-      await User.create({
-        _id: authorId,
-        email: 'author-delete@example.com',
-        emailVerified: true,
-        provider: 'local',
-      });
-
-      await createAgent({
-        id: agentId,
-        name: 'Delete Test Agent',
-        author: authorId,
-        model: 'gpt-4',
-        provider: 'openai',
-        tool_resources: {
-          file_search: {
-            file_ids: [attachedFileId],
-          },
-        },
-      });
-
-      const { hasAccessToFilesViaAgent } = require('~/server/services/Files/permissions');
-      const accessMap = await hasAccessToFilesViaAgent({
-        userId: authorId,
-        role: SystemRoles.USER,
-        fileIds: [attachedFileId, unattachedFileId],
-        agentId,
-        isDelete: true,
-      });
-
-      expect(accessMap.get(attachedFileId)).toBe(true);
-      expect(accessMap.get(unattachedFileId)).toBe(false);
+      expect(accessMap.get(fileIds[2])).toBe(true);
    });

    it('should handle non-existent agent gracefully', async () => {
--- a/api/models/Role.js
+++ b/api/models/Role.js
@ -114,28 +114,6 @@ async function updateAccessPermissions(roleName, permissionsUpdate, roleData) {
      }
    }

-    // Migrate legacy SHARED_GLOBAL → SHARE for PROMPTS and AGENTS.
-    // SHARED_GLOBAL was removed in favour of SHARE in PR #11283. If the DB still has
-    // SHARED_GLOBAL but not SHARE, inherit the value so sharing intent is preserved.
-    const legacySharedGlobalTypes = ['PROMPTS', 'AGENTS'];
-    for (const legacyPermType of legacySharedGlobalTypes) {
-      const existingTypePerms = currentPermissions[legacyPermType];
-      if (
-        existingTypePerms &&
-        'SHARED_GLOBAL' in existingTypePerms &&
-        !('SHARE' in existingTypePerms) &&
-        updates[legacyPermType] &&
-        // Don't override an explicit SHARE value the caller already provided
-        !('SHARE' in updates[legacyPermType])
-      ) {
-        const inheritedValue = existingTypePerms['SHARED_GLOBAL'];
-        updates[legacyPermType]['SHARE'] = inheritedValue;
-        logger.info(
-          `Migrating '${roleName}' role ${legacyPermType}.SHARED_GLOBAL=${inheritedValue} → SHARE`,
-        );
-      }
-    }
-
    for (const [permissionType, permissions] of Object.entries(updates)) {
      const currentTypePermissions = currentPermissions[permissionType] || {};
      updatedPermissions[permissionType] = { ...currentTypePermissions };
@ -151,32 +129,6 @@ async function updateAccessPermissions(roleName, permissionsUpdate, roleData) {
      }
    }

-    // Clean up orphaned SHARED_GLOBAL fields left in DB after the schema rename.
-    // Since we $set the full permissions object, deleting from updatedPermissions
-    // is sufficient to remove the field from MongoDB.
-    for (const legacyPermType of legacySharedGlobalTypes) {
-      const existingTypePerms = currentPermissions[legacyPermType];
-      if (existingTypePerms && 'SHARED_GLOBAL' in existingTypePerms) {
-        if (!updates[legacyPermType]) {
-          // permType wasn't in the update payload so the migration block above didn't run.
-          // Create a writable copy and handle the SHARED_GLOBAL → SHARE inheritance here
-          // to avoid removing SHARED_GLOBAL without writing SHARE (data loss).
-          updatedPermissions[legacyPermType] = { ...existingTypePerms };
-          if (!('SHARE' in existingTypePerms)) {
-            updatedPermissions[legacyPermType]['SHARE'] = existingTypePerms['SHARED_GLOBAL'];
-            logger.info(
-              `Migrating '${roleName}' role ${legacyPermType}.SHARED_GLOBAL=${existingTypePerms['SHARED_GLOBAL']} → SHARE`,
-            );
-          }
-        }
-        delete updatedPermissions[legacyPermType]['SHARED_GLOBAL'];
-        hasChanges = true;
-        logger.info(
-          `Removed legacy SHARED_GLOBAL field from '${roleName}' role ${legacyPermType} permissions`,
-        );
-      }
-    }
-
    if (hasChanges) {
      const updateObj = { permissions: updatedPermissions };

--- a/api/models/Role.spec.js
+++ b/api/models/Role.spec.js
@ -233,112 +233,6 @@ describe('updateAccessPermissions', () => {
    expect(updatedRole.permissions[PermissionTypes.MULTI_CONVO]).toEqual({ USE: true });
  });

-  it('should inherit SHARED_GLOBAL value into SHARE when SHARE is absent from both DB and update', async () => {
-    // Simulates the startup backfill path: caller sends SHARE_PUBLIC but not SHARE;
-    // migration should inherit SHARED_GLOBAL to preserve the deployment's sharing intent.
-    await Role.collection.insertOne({
-      name: SystemRoles.USER,
-      permissions: {
-        [PermissionTypes.PROMPTS]: { USE: true, CREATE: true, SHARED_GLOBAL: true },
-        [PermissionTypes.AGENTS]: { USE: true, CREATE: true, SHARED_GLOBAL: false },
-      },
-    });
-
-    await updateAccessPermissions(SystemRoles.USER, {
-      // No explicit SHARE — migration should inherit from SHARED_GLOBAL
-      [PermissionTypes.PROMPTS]: { SHARE_PUBLIC: false },
-      [PermissionTypes.AGENTS]: { SHARE_PUBLIC: false },
-    });
-
-    const updatedRole = await getRoleByName(SystemRoles.USER);
-
-    // SHARED_GLOBAL=true → SHARE=true (inherited)
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARE).toBe(true);
-    // SHARED_GLOBAL=false → SHARE=false (inherited)
-    expect(updatedRole.permissions[PermissionTypes.AGENTS].SHARE).toBe(false);
-    // SHARED_GLOBAL cleaned up
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARED_GLOBAL).toBeUndefined();
-    expect(updatedRole.permissions[PermissionTypes.AGENTS].SHARED_GLOBAL).toBeUndefined();
-  });
-
-  it('should respect explicit SHARE in update payload and not override it with SHARED_GLOBAL', async () => {
-    // Caller explicitly passes SHARE: false even though SHARED_GLOBAL=true in DB.
-    // The explicit intent must win; migration must not silently overwrite it.
-    await Role.collection.insertOne({
-      name: SystemRoles.USER,
-      permissions: {
-        [PermissionTypes.PROMPTS]: { USE: true, SHARED_GLOBAL: true },
-      },
-    });
-
-    await updateAccessPermissions(SystemRoles.USER, {
-      [PermissionTypes.PROMPTS]: { SHARE: false }, // explicit false — should be preserved
-    });
-
-    const updatedRole = await getRoleByName(SystemRoles.USER);
-
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARE).toBe(false);
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARED_GLOBAL).toBeUndefined();
-  });
-
-  it('should migrate SHARED_GLOBAL to SHARE even when the permType is not in the update payload', async () => {
-    // Bug #2 regression: cleanup block removes SHARED_GLOBAL but migration block only
-    // runs when the permType is in the update payload. Without the fix, SHARE would be
-    // lost when any other permType (e.g. MULTI_CONVO) is the only thing being updated.
-    await Role.collection.insertOne({
-      name: SystemRoles.USER,
-      permissions: {
-        [PermissionTypes.PROMPTS]: {
-          USE: true,
-          SHARED_GLOBAL: true, // legacy — NO SHARE present
-        },
-        [PermissionTypes.MULTI_CONVO]: { USE: false },
-      },
-    });
-
-    // Only update MULTI_CONVO — PROMPTS is intentionally absent from the payload
-    await updateAccessPermissions(SystemRoles.USER, {
-      [PermissionTypes.MULTI_CONVO]: { USE: true },
-    });
-
-    const updatedRole = await getRoleByName(SystemRoles.USER);
-
-    // SHARE should have been inherited from SHARED_GLOBAL, not silently dropped
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARE).toBe(true);
-    // SHARED_GLOBAL should be removed
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARED_GLOBAL).toBeUndefined();
-    // Original USE should be untouched
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].USE).toBe(true);
-    // The actual update should have applied
-    expect(updatedRole.permissions[PermissionTypes.MULTI_CONVO].USE).toBe(true);
-  });
-
-  it('should remove orphaned SHARED_GLOBAL when SHARE already exists and permType is not in update', async () => {
-    // Safe cleanup case: SHARE already set, SHARED_GLOBAL is just orphaned noise.
-    // SHARE must not be changed; SHARED_GLOBAL must be removed.
-    await Role.collection.insertOne({
-      name: SystemRoles.USER,
-      permissions: {
-        [PermissionTypes.PROMPTS]: {
-          USE: true,
-          SHARE: true, // already migrated
-          SHARED_GLOBAL: true, // orphaned
-        },
-        [PermissionTypes.MULTI_CONVO]: { USE: false },
-      },
-    });
-
-    await updateAccessPermissions(SystemRoles.USER, {
-      [PermissionTypes.MULTI_CONVO]: { USE: true },
-    });
-
-    const updatedRole = await getRoleByName(SystemRoles.USER);
-
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARED_GLOBAL).toBeUndefined();
-    expect(updatedRole.permissions[PermissionTypes.PROMPTS].SHARE).toBe(true);
-    expect(updatedRole.permissions[PermissionTypes.MULTI_CONVO].USE).toBe(true);
-  });
-
  it('should not update MULTI_CONVO permissions when no changes are needed', async () => {
    await new Role({
      name: SystemRoles.USER,
--- a/api/models/Transaction.js
+++ b/api/models/Transaction.js
@ -1,19 +1,153 @@
-const { logger, CANCEL_RATE } = require('@librechat/data-schemas');
+const { logger } = require('@librechat/data-schemas');
 const { getMultiplier, getCacheMultiplier } = require('./tx');
-const { Transaction } = require('~/db/models');
-const { updateBalance } = require('~/models');
+const { Transaction, Balance } = require('~/db/models');
+
+const cancelRate = 1.15;
+
+/**
+ * Updates a user's token balance based on a transaction using optimistic concurrency control
+ * without schema changes. Compatible with DocumentDB.
+ * @async
+ * @function
+ * @param {Object} params - The function parameters.
+ * @param {string|mongoose.Types.ObjectId} params.user - The user ID.
+ * @param {number} params.incrementValue - The value to increment the balance by (can be negative).
+ * @param {import('mongoose').UpdateQuery<import('@librechat/data-schemas').IBalance>['$set']} [params.setValues] - Optional additional fields to set.
+ * @returns {Promise<Object>} Returns the updated balance document (lean).
+ * @throws {Error} Throws an error if the update fails after multiple retries.
+ */
+const updateBalance = async ({ user, incrementValue, setValues }) => {
+  let maxRetries = 10; // Number of times to retry on conflict
+  let delay = 50; // Initial retry delay in ms
+  let lastError = null;
+
+  for (let attempt = 1; attempt <= maxRetries; attempt++) {
+    let currentBalanceDoc;
+    try {
+      // 1. Read the current document state
+      currentBalanceDoc = await Balance.findOne({ user }).lean();
+      const currentCredits = currentBalanceDoc ? currentBalanceDoc.tokenCredits : 0;
+
+      // 2. Calculate the desired new state
+      const potentialNewCredits = currentCredits + incrementValue;
+      const newCredits = Math.max(0, potentialNewCredits); // Ensure balance doesn't go below zero
+
+      // 3. Prepare the update payload
+      const updatePayload = {
+        $set: {
+          tokenCredits: newCredits,
+          ...(setValues || {}), // Merge other values to set
+        },
+      };
+
+      // 4. Attempt the conditional update or upsert
+      let updatedBalance = null;
+      if (currentBalanceDoc) {
+        // --- Document Exists: Perform Conditional Update ---
+        // Try to update only if the tokenCredits match the value we read (currentCredits)
+        updatedBalance = await Balance.findOneAndUpdate(
+          {
+            user: user,
+            tokenCredits: currentCredits, // Optimistic lock: condition based on the read value
+          },
+          updatePayload,
+          {
+            new: true, // Return the modified document
+            // lean: true, // .lean() is applied after query execution in Mongoose >= 6
+          },
+        ).lean(); // Use lean() for plain JS object
+
+        if (updatedBalance) {
+          // Success! The update was applied based on the expected current state.
+          return updatedBalance;
+        }
+        // If updatedBalance is null, it means tokenCredits changed between read and write (conflict).
+        lastError = new Error(`Concurrency conflict for user ${user} on attempt ${attempt}.`);
+        // Proceed to retry logic below.
+      } else {
+        // --- Document Does Not Exist: Perform Conditional Upsert ---
+        // Try to insert the document, but only if it still doesn't exist.
+        // Using tokenCredits: {$exists: false} helps prevent race conditions where
+        // another process creates the doc between our findOne and findOneAndUpdate.
+        try {
+          updatedBalance = await Balance.findOneAndUpdate(
+            {
+              user: user,
+              // Attempt to match only if the document doesn't exist OR was just created
+              // without tokenCredits (less likely but possible). A simple { user } filter
+              // might also work, relying on the retry for conflicts.
+              // Let's use a simpler filter and rely on retry for races.
+              // tokenCredits: { $exists: false } // This condition might be too strict if doc exists with 0 credits
+            },
+            updatePayload,
+            {
+              upsert: true, // Create if doesn't exist
+              new: true, // Return the created/updated document
+              // setDefaultsOnInsert: true, // Ensure schema defaults are applied on insert
+              // lean: true,
+            },
+          ).lean();
+
+          if (updatedBalance) {
+            // Upsert succeeded (likely created the document)
+            return updatedBalance;
+          }
+          // If null, potentially a rare race condition during upsert. Retry should handle it.
+          lastError = new Error(
+            `Upsert race condition suspected for user ${user} on attempt ${attempt}.`,
+          );
+        } catch (error) {
+          if (error.code === 11000) {
+            // E11000 duplicate key error on index
+            // This means another process created the document *just* before our upsert.
+            // It's a concurrency conflict during creation. We should retry.
+            lastError = error; // Store the error
+            // Proceed to retry logic below.
+          } else {
+            // Different error, rethrow
+            throw error;
+          }
+        }
+      } // End if/else (document exists?)
+    } catch (error) {
+      // Catch errors from findOne or unexpected findOneAndUpdate errors
+      logger.error(`[updateBalance] Error during attempt ${attempt} for user ${user}:`, error);
+      lastError = error; // Store the error
+      // Consider stopping retries for non-transient errors, but for now, we retry.
+    }
+
+    // If we reached here, it means the update failed (conflict or error), wait and retry
+    if (attempt < maxRetries) {
+      const jitter = Math.random() * delay * 0.5; // Add jitter to delay
+      await new Promise((resolve) => setTimeout(resolve, delay + jitter));
+      delay = Math.min(delay * 2, 2000); // Exponential backoff with cap
+    }
+  } // End for loop (retries)
+
+  // If loop finishes without success, throw the last encountered error or a generic one
+  logger.error(
+    `[updateBalance] Failed to update balance for user ${user} after ${maxRetries} attempts.`,
+  );
+  throw (
+    lastError ||
+    new Error(
+      `Failed to update balance for user ${user} after maximum retries due to persistent conflicts.`,
+    )
+  );
+};

 /** Method to calculate and set the tokenValue for a transaction */
 function calculateTokenValue(txn) {
-  const { valueKey, tokenType, model, endpointTokenConfig, inputTokenCount } = txn;
-  const multiplier = Math.abs(
-    getMultiplier({ valueKey, tokenType, model, endpointTokenConfig, inputTokenCount }),
-  );
+  if (!txn.valueKey || !txn.tokenType) {
+    txn.tokenValue = txn.rawAmount;
+  }
+  const { valueKey, tokenType, model, endpointTokenConfig } = txn;
+  const multiplier = Math.abs(getMultiplier({ valueKey, tokenType, model, endpointTokenConfig }));
  txn.rate = multiplier;
  txn.tokenValue = txn.rawAmount * multiplier;
  if (txn.context && txn.tokenType === 'completion' && txn.context === 'incomplete') {
-    txn.tokenValue = Math.ceil(txn.tokenValue * CANCEL_RATE);
-    txn.rate *= CANCEL_RATE;
+    txn.tokenValue = Math.ceil(txn.tokenValue * cancelRate);
+    txn.rate *= cancelRate;
  }
 }

@ -32,7 +166,6 @@ async function createAutoRefillTransaction(txData) {
  }
  const transaction = new Transaction(txData);
  transaction.endpointTokenConfig = txData.endpointTokenConfig;
-  transaction.inputTokenCount = txData.inputTokenCount;
  calculateTokenValue(transaction);
  await transaction.save();

@ -67,7 +200,6 @@ async function createTransaction(_txData) {

  const transaction = new Transaction(txData);
  transaction.endpointTokenConfig = txData.endpointTokenConfig;
-  transaction.inputTokenCount = txData.inputTokenCount;
  calculateTokenValue(transaction);

  await transaction.save();
@ -99,9 +231,10 @@ async function createStructuredTransaction(_txData) {
    return;
  }

-  const transaction = new Transaction(txData);
-  transaction.endpointTokenConfig = txData.endpointTokenConfig;
-  transaction.inputTokenCount = txData.inputTokenCount;
+  const transaction = new Transaction({
+    ...txData,
+    endpointTokenConfig: txData.endpointTokenConfig,
+  });

  calculateStructuredTokenValue(transaction);

@ -133,15 +266,10 @@ function calculateStructuredTokenValue(txn) {
    return;
  }

-  const { model, endpointTokenConfig, inputTokenCount } = txn;
+  const { model, endpointTokenConfig } = txn;

  if (txn.tokenType === 'prompt') {
-    const inputMultiplier = getMultiplier({
-      tokenType: 'prompt',
-      model,
-      endpointTokenConfig,
-      inputTokenCount,
-    });
+    const inputMultiplier = getMultiplier({ tokenType: 'prompt', model, endpointTokenConfig });
    const writeMultiplier =
      getCacheMultiplier({ cacheType: 'write', model, endpointTokenConfig }) ?? inputMultiplier;
    const readMultiplier =
@ -176,23 +304,18 @@ function calculateStructuredTokenValue(txn) {

    txn.rawAmount = -totalPromptTokens;
  } else if (txn.tokenType === 'completion') {
-    const multiplier = getMultiplier({
-      tokenType: txn.tokenType,
-      model,
-      endpointTokenConfig,
-      inputTokenCount,
-    });
+    const multiplier = getMultiplier({ tokenType: txn.tokenType, model, endpointTokenConfig });
    txn.rate = Math.abs(multiplier);
    txn.tokenValue = -Math.abs(txn.rawAmount) * multiplier;
    txn.rawAmount = -Math.abs(txn.rawAmount);
  }

  if (txn.context && txn.tokenType === 'completion' && txn.context === 'incomplete') {
-    txn.tokenValue = Math.ceil(txn.tokenValue * CANCEL_RATE);
-    txn.rate *= CANCEL_RATE;
+    txn.tokenValue = Math.ceil(txn.tokenValue * cancelRate);
+    txn.rate *= cancelRate;
    if (txn.rateDetail) {
      txn.rateDetail = Object.fromEntries(
-        Object.entries(txn.rateDetail).map(([k, v]) => [k, v * CANCEL_RATE]),
+        Object.entries(txn.rateDetail).map(([k, v]) => [k, v * cancelRate]),
      );
    }
  }
--- a/api/models/Transaction.spec.js
+++ b/api/models/Transaction.spec.js
@ -1,10 +1,8 @@
 const mongoose = require('mongoose');
-const { recordCollectedUsage } = require('@librechat/api');
-const { createMethods } = require('@librechat/data-schemas');
 const { MongoMemoryServer } = require('mongodb-memory-server');
-const { getMultiplier, getCacheMultiplier, premiumTokenValues, tokenValues } = require('./tx');
-const { createTransaction, createStructuredTransaction } = require('./Transaction');
 const { spendTokens, spendStructuredTokens } = require('./spendTokens');
+const { getMultiplier, getCacheMultiplier } = require('./tx');
+const { createTransaction, createStructuredTransaction } = require('./Transaction');
 const { Balance, Transaction } = require('~/db/models');

 let mongoServer;
@ -566,760 +564,3 @@ describe('Transactions Config Tests', () => {
    expect(balance.tokenCredits).toBe(initialBalance);
  });
 });
-
-describe('calculateTokenValue Edge Cases', () => {
-  test('should derive multiplier from model when valueKey is not provided', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gpt-4';
-    const promptTokens = 1000;
-
-    const result = await createTransaction({
-      user: userId,
-      conversationId: 'test-no-valuekey',
-      model,
-      tokenType: 'prompt',
-      rawAmount: -promptTokens,
-      context: 'test',
-      balance: { enabled: true },
-    });
-
-    const expectedRate = getMultiplier({ model, tokenType: 'prompt' });
-    expect(result.rate).toBe(expectedRate);
-
-    const tx = await Transaction.findOne({ user: userId });
-    expect(tx.tokenValue).toBe(-promptTokens * expectedRate);
-    expect(tx.rate).toBe(expectedRate);
-  });
-
-  test('should derive valueKey and apply correct rate for an unknown model with tokenType', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    await createTransaction({
-      user: userId,
-      conversationId: 'test-unknown-model',
-      model: 'some-unrecognized-model-xyz',
-      tokenType: 'prompt',
-      rawAmount: -500,
-      context: 'test',
-      balance: { enabled: true },
-    });
-
-    const tx = await Transaction.findOne({ user: userId });
-    expect(tx.rate).toBeDefined();
-    expect(tx.rate).toBeGreaterThan(0);
-    expect(tx.tokenValue).toBe(tx.rawAmount * tx.rate);
-  });
-
-  test('should correctly apply model-derived multiplier without valueKey for completion', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const completionTokens = 500;
-
-    const result = await createTransaction({
-      user: userId,
-      conversationId: 'test-completion-no-valuekey',
-      model,
-      tokenType: 'completion',
-      rawAmount: -completionTokens,
-      context: 'test',
-      balance: { enabled: true },
-    });
-
-    const expectedRate = getMultiplier({ model, tokenType: 'completion' });
-    expect(expectedRate).toBe(tokenValues[model].completion);
-    expect(result.rate).toBe(expectedRate);
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(
-      initialBalance - completionTokens * expectedRate,
-      0,
-    );
-  });
-});
-
-describe('Premium Token Pricing Integration Tests', () => {
-  test('spendTokens should apply standard pricing when prompt tokens are below premium threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const promptTokens = 100000;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-premium-below',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const standardPromptRate = tokenValues[model].prompt;
-    const standardCompletionRate = tokenValues[model].completion;
-    const expectedCost =
-      promptTokens * standardPromptRate + completionTokens * standardCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendTokens should apply premium pricing when prompt tokens exceed premium threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const promptTokens = 250000;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-premium-above',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const premiumPromptRate = premiumTokenValues[model].prompt;
-    const premiumCompletionRate = premiumTokenValues[model].completion;
-    const expectedCost =
-      promptTokens * premiumPromptRate + completionTokens * premiumCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendTokens should apply standard pricing at exactly the premium threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const promptTokens = premiumTokenValues[model].threshold;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-premium-exact',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const standardPromptRate = tokenValues[model].prompt;
-    const standardCompletionRate = tokenValues[model].completion;
-    const expectedCost =
-      promptTokens * standardPromptRate + completionTokens * standardCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendStructuredTokens should apply premium pricing when total input tokens exceed threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const txData = {
-      user: userId,
-      conversationId: 'test-structured-premium',
-      model,
-      context: 'message',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    const tokenUsage = {
-      promptTokens: {
-        input: 200000,
-        write: 10000,
-        read: 5000,
-      },
-      completionTokens: 1000,
-    };
-
-    const totalInput =
-      tokenUsage.promptTokens.input + tokenUsage.promptTokens.write + tokenUsage.promptTokens.read;
-
-    await spendStructuredTokens(txData, tokenUsage);
-
-    const premiumPromptRate = premiumTokenValues[model].prompt;
-    const premiumCompletionRate = premiumTokenValues[model].completion;
-    const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' });
-    const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' });
-
-    const expectedPromptCost =
-      tokenUsage.promptTokens.input * premiumPromptRate +
-      tokenUsage.promptTokens.write * writeMultiplier +
-      tokenUsage.promptTokens.read * readMultiplier;
-    const expectedCompletionCost = tokenUsage.completionTokens * premiumCompletionRate;
-    const expectedTotalCost = expectedPromptCost + expectedCompletionCost;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(totalInput).toBeGreaterThan(premiumTokenValues[model].threshold);
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedTotalCost, 0);
-  });
-
-  test('spendStructuredTokens should apply standard pricing when total input tokens are below threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const txData = {
-      user: userId,
-      conversationId: 'test-structured-standard',
-      model,
-      context: 'message',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    const tokenUsage = {
-      promptTokens: {
-        input: 50000,
-        write: 10000,
-        read: 5000,
-      },
-      completionTokens: 1000,
-    };
-
-    const totalInput =
-      tokenUsage.promptTokens.input + tokenUsage.promptTokens.write + tokenUsage.promptTokens.read;
-
-    await spendStructuredTokens(txData, tokenUsage);
-
-    const standardPromptRate = tokenValues[model].prompt;
-    const standardCompletionRate = tokenValues[model].completion;
-    const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' });
-    const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' });
-
-    const expectedPromptCost =
-      tokenUsage.promptTokens.input * standardPromptRate +
-      tokenUsage.promptTokens.write * writeMultiplier +
-      tokenUsage.promptTokens.read * readMultiplier;
-    const expectedCompletionCost = tokenUsage.completionTokens * standardCompletionRate;
-    const expectedTotalCost = expectedPromptCost + expectedCompletionCost;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(totalInput).toBeLessThanOrEqual(premiumTokenValues[model].threshold);
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedTotalCost, 0);
-  });
-
-  test('spendTokens should apply standard pricing for gemini-3.1-pro-preview below threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gemini-3.1-pro-preview';
-    const promptTokens = 100000;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-gemini31-below',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const standardPromptRate = tokenValues['gemini-3.1'].prompt;
-    const standardCompletionRate = tokenValues['gemini-3.1'].completion;
-    const expectedCost =
-      promptTokens * standardPromptRate + completionTokens * standardCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendTokens should apply premium pricing for gemini-3.1-pro-preview above threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gemini-3.1-pro-preview';
-    const promptTokens = 250000;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-gemini31-above',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const premiumPromptRate = premiumTokenValues['gemini-3.1'].prompt;
-    const premiumCompletionRate = premiumTokenValues['gemini-3.1'].completion;
-    const expectedCost =
-      promptTokens * premiumPromptRate + completionTokens * premiumCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendTokens should apply standard pricing for gemini-3.1-pro-preview at exactly the threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gemini-3.1-pro-preview';
-    const promptTokens = premiumTokenValues['gemini-3.1'].threshold;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-gemini31-exact',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const standardPromptRate = tokenValues['gemini-3.1'].prompt;
-    const standardCompletionRate = tokenValues['gemini-3.1'].completion;
-    const expectedCost =
-      promptTokens * standardPromptRate + completionTokens * standardCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('spendStructuredTokens should apply premium pricing for gemini-3.1 when total input exceeds threshold', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gemini-3.1-pro-preview';
-    const txData = {
-      user: userId,
-      conversationId: 'test-gemini31-structured-premium',
-      model,
-      context: 'message',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    const tokenUsage = {
-      promptTokens: {
-        input: 200000,
-        write: 10000,
-        read: 5000,
-      },
-      completionTokens: 1000,
-    };
-
-    const totalInput =
-      tokenUsage.promptTokens.input + tokenUsage.promptTokens.write + tokenUsage.promptTokens.read;
-
-    await spendStructuredTokens(txData, tokenUsage);
-
-    const premiumPromptRate = premiumTokenValues['gemini-3.1'].prompt;
-    const premiumCompletionRate = premiumTokenValues['gemini-3.1'].completion;
-    const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' });
-    const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' });
-
-    const expectedPromptCost =
-      tokenUsage.promptTokens.input * premiumPromptRate +
-      tokenUsage.promptTokens.write * writeMultiplier +
-      tokenUsage.promptTokens.read * readMultiplier;
-    const expectedCompletionCost = tokenUsage.completionTokens * premiumCompletionRate;
-    const expectedTotalCost = expectedPromptCost + expectedCompletionCost;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(totalInput).toBeGreaterThan(premiumTokenValues['gemini-3.1'].threshold);
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedTotalCost, 0);
-  });
-
-  test('non-premium models should not be affected by inputTokenCount regardless of prompt size', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-5';
-    const promptTokens = 300000;
-    const completionTokens = 500;
-
-    const txData = {
-      user: userId,
-      conversationId: 'test-no-premium',
-      model,
-      context: 'test',
-      endpointTokenConfig: null,
-      balance: { enabled: true },
-    };
-
-    await spendTokens(txData, { promptTokens, completionTokens });
-
-    const standardPromptRate = getMultiplier({ model, tokenType: 'prompt' });
-    const standardCompletionRate = getMultiplier({ model, tokenType: 'completion' });
-    const expectedCost =
-      promptTokens * standardPromptRate + completionTokens * standardCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-});
-
-describe('Bulk path parity', () => {
-  /**
-   * Each test here mirrors an existing legacy test above, replacing spendTokens/
-   * spendStructuredTokens with recordCollectedUsage + bulk deps.
-   * The balance deduction and transaction document fields must be numerically identical.
-   */
-  let bulkDeps;
-  let methods;
-
-  beforeEach(() => {
-    methods = createMethods(mongoose);
-    bulkDeps = {
-      spendTokens: () => Promise.resolve(),
-      spendStructuredTokens: () => Promise.resolve(),
-      pricing: { getMultiplier, getCacheMultiplier },
-      bulkWriteOps: {
-        insertMany: methods.bulkInsertTransactions,
-        updateBalance: methods.updateBalance,
-      },
-    };
-  });
-
-  test('balance should decrease when spending tokens via bulk path', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gpt-3.5-turbo';
-    const promptTokens = 100;
-    const completionTokens = 50;
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model,
-      context: 'test',
-      balance: { enabled: true },
-      transactions: { enabled: true },
-      collectedUsage: [{ input_tokens: promptTokens, output_tokens: completionTokens, model }],
-    });
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    const promptMultiplier = getMultiplier({
-      model,
-      tokenType: 'prompt',
-      inputTokenCount: promptTokens,
-    });
-    const completionMultiplier = getMultiplier({
-      model,
-      tokenType: 'completion',
-      inputTokenCount: promptTokens,
-    });
-    const expectedTotalCost =
-      promptTokens * promptMultiplier + completionTokens * completionMultiplier;
-    const expectedBalance = initialBalance - expectedTotalCost;
-
-    expect(updatedBalance.tokenCredits).toBeCloseTo(expectedBalance, 0);
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(2);
-  });
-
-  test('bulk path should not update balance when balance.enabled is false', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'gpt-3.5-turbo';
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model,
-      context: 'test',
-      balance: { enabled: false },
-      transactions: { enabled: true },
-      collectedUsage: [{ input_tokens: 100, output_tokens: 50, model }],
-    });
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBe(initialBalance);
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(2); // transactions still recorded
-  });
-
-  test('bulk path should not insert when transactions.enabled is false', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model: 'gpt-3.5-turbo',
-      context: 'test',
-      balance: { enabled: true },
-      transactions: { enabled: false },
-      collectedUsage: [{ input_tokens: 100, output_tokens: 50, model: 'gpt-3.5-turbo' }],
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(0);
-    const balance = await Balance.findOne({ user: userId });
-    expect(balance.tokenCredits).toBe(initialBalance);
-  });
-
-  test('bulk path handles incomplete context for completion tokens — same CANCEL_RATE as legacy', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 17613154.55;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-3-5-sonnet';
-    const promptTokens = 10;
-    const completionTokens = 50;
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-convo',
-      model,
-      context: 'incomplete',
-      balance: { enabled: true },
-      transactions: { enabled: true },
-      collectedUsage: [{ input_tokens: promptTokens, output_tokens: completionTokens, model }],
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    const completionTx = txns.find((t) => t.tokenType === 'completion');
-    const completionMultiplier = getMultiplier({
-      model,
-      tokenType: 'completion',
-      inputTokenCount: promptTokens,
-    });
-    expect(completionTx.tokenValue).toBeCloseTo(-completionTokens * completionMultiplier * 1.15, 0);
-  });
-
-  test('bulk path structured tokens — balance deduction matches legacy spendStructuredTokens', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 17613154.55;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-3-5-sonnet';
-    const promptInput = 11;
-    const promptWrite = 140522;
-    const promptRead = 0;
-    const completionTokens = 5;
-    const totalInput = promptInput + promptWrite + promptRead;
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-convo',
-      model,
-      context: 'message',
-      balance: { enabled: true },
-      transactions: { enabled: true },
-      collectedUsage: [
-        {
-          input_tokens: promptInput,
-          output_tokens: completionTokens,
-          model,
-          input_token_details: { cache_creation: promptWrite, cache_read: promptRead },
-        },
-      ],
-    });
-
-    const promptMultiplier = getMultiplier({
-      model,
-      tokenType: 'prompt',
-      inputTokenCount: totalInput,
-    });
-    const completionMultiplier = getMultiplier({
-      model,
-      tokenType: 'completion',
-      inputTokenCount: totalInput,
-    });
-    const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' }) ?? promptMultiplier;
-    const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' }) ?? promptMultiplier;
-
-    const expectedPromptCost =
-      promptInput * promptMultiplier + promptWrite * writeMultiplier + promptRead * readMultiplier;
-    const expectedCompletionCost = completionTokens * completionMultiplier;
-    const expectedTotalCost = expectedPromptCost + expectedCompletionCost;
-    const expectedBalance = initialBalance - expectedTotalCost;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(Math.abs(updatedBalance.tokenCredits - expectedBalance)).toBeLessThan(100);
-  });
-
-  test('premium pricing above threshold via bulk path — same balance as legacy', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-6';
-    const promptTokens = 250000;
-    const completionTokens = 500;
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-premium',
-      model,
-      context: 'test',
-      balance: { enabled: true },
-      transactions: { enabled: true },
-      collectedUsage: [{ input_tokens: promptTokens, output_tokens: completionTokens, model }],
-    });
-
-    const premiumPromptRate = premiumTokenValues[model].prompt;
-    const premiumCompletionRate = premiumTokenValues[model].completion;
-    const expectedCost =
-      promptTokens * premiumPromptRate + completionTokens * premiumCompletionRate;
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-  });
-
-  test('real-world multi-entry batch: 5 sequential tool calls — same total deduction as 5 legacy spendTokens calls', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 100000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    const model = 'claude-opus-4-5-20251101';
-    const calls = [
-      { input_tokens: 31596, output_tokens: 151 },
-      { input_tokens: 35368, output_tokens: 150 },
-      { input_tokens: 58362, output_tokens: 295 },
-      { input_tokens: 112604, output_tokens: 193 },
-      { input_tokens: 257440, output_tokens: 2217 },
-    ];
-
-    let expectedTotalCost = 0;
-    for (const { input_tokens, output_tokens } of calls) {
-      const pm = getMultiplier({ model, tokenType: 'prompt', inputTokenCount: input_tokens });
-      const cm = getMultiplier({ model, tokenType: 'completion', inputTokenCount: input_tokens });
-      expectedTotalCost += input_tokens * pm + output_tokens * cm;
-    }
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-sequential',
-      model,
-      context: 'message',
-      balance: { enabled: true },
-      transactions: { enabled: true },
-      collectedUsage: calls.map((c) => ({ ...c, model })),
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(10); // 5 calls × 2 docs (prompt + completion)
-
-    const updatedBalance = await Balance.findOne({ user: userId });
-    expect(updatedBalance.tokenCredits).toBeCloseTo(initialBalance - expectedTotalCost, 0);
-  });
-
-  test('bulk path should save transaction but not update balance when balance disabled, transactions enabled', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model: 'gpt-3.5-turbo',
-      context: 'test',
-      balance: { enabled: false },
-      transactions: { enabled: true },
-      collectedUsage: [{ input_tokens: 100, output_tokens: 50, model: 'gpt-3.5-turbo' }],
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(2);
-    expect(txns[0].rawAmount).toBeDefined();
-    const balance = await Balance.findOne({ user: userId });
-    expect(balance.tokenCredits).toBe(initialBalance);
-  });
-
-  test('bulk path structured tokens should not save when transactions.enabled is false', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model: 'claude-3-5-sonnet',
-      context: 'message',
-      balance: { enabled: true },
-      transactions: { enabled: false },
-      collectedUsage: [
-        {
-          input_tokens: 10,
-          output_tokens: 5,
-          model: 'claude-3-5-sonnet',
-          input_token_details: { cache_creation: 100, cache_read: 5 },
-        },
-      ],
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(0);
-    const balance = await Balance.findOne({ user: userId });
-    expect(balance.tokenCredits).toBe(initialBalance);
-  });
-
-  test('bulk path structured tokens should save but not update balance when balance disabled', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const initialBalance = 10000000;
-    await Balance.create({ user: userId, tokenCredits: initialBalance });
-
-    await recordCollectedUsage(bulkDeps, {
-      user: userId.toString(),
-      conversationId: 'test-conversation-id',
-      model: 'claude-3-5-sonnet',
-      context: 'message',
-      balance: { enabled: false },
-      transactions: { enabled: true },
-      collectedUsage: [
-        {
-          input_tokens: 10,
-          output_tokens: 5,
-          model: 'claude-3-5-sonnet',
-          input_token_details: { cache_creation: 100, cache_read: 5 },
-        },
-      ],
-    });
-
-    const txns = await Transaction.find({ user: userId }).lean();
-    expect(txns).toHaveLength(2);
-    const promptTx = txns.find((t) => t.tokenType === 'prompt');
-    expect(promptTx.inputTokens).toBe(-10);
-    expect(promptTx.writeTokens).toBe(-100);
-    expect(promptTx.readTokens).toBe(-5);
-    const balance = await Balance.findOne({ user: userId });
-    expect(balance.tokenCredits).toBe(initialBalance);
-  });
-});
--- a/api/models/loadAddedAgent.js
+++ b/api/models/loadAddedAgent.js
@ -48,14 +48,14 @@ const loadAddedAgent = async ({ req, conversation, primaryAgent }) => {
    return null;
  }

+  // If there's an agent_id, load the existing agent
  if (conversation.agent_id && !isEphemeralAgentId(conversation.agent_id)) {
-    let agent = req.resolvedAddedAgent;
-    if (!agent) {
-      if (!getAgent) {
-        throw new Error('getAgent not initialized - call setGetAgent first');
-      }
-      agent = await getAgent({ id: conversation.agent_id });
+    if (!getAgent) {
+      throw new Error('getAgent not initialized - call setGetAgent first');
    }
+    const agent = await getAgent({
+      id: conversation.agent_id,
+    });

    if (!agent) {
      logger.warn(`[loadAddedAgent] Agent ${conversation.agent_id} not found`);
--- a/api/models/spendTokens.js
+++ b/api/models/spendTokens.js
@ -24,14 +24,12 @@ const spendTokens = async (txData, tokenUsage) => {
    },
  );
  let prompt, completion;
-  const normalizedPromptTokens = Math.max(promptTokens ?? 0, 0);
  try {
    if (promptTokens !== undefined) {
      prompt = await createTransaction({
        ...txData,
        tokenType: 'prompt',
-        rawAmount: promptTokens === 0 ? 0 : -normalizedPromptTokens,
-        inputTokenCount: normalizedPromptTokens,
+        rawAmount: promptTokens === 0 ? 0 : -Math.max(promptTokens, 0),
      });
    }

@ -40,7 +38,6 @@ const spendTokens = async (txData, tokenUsage) => {
        ...txData,
        tokenType: 'completion',
        rawAmount: completionTokens === 0 ? 0 : -Math.max(completionTokens, 0),
-        inputTokenCount: normalizedPromptTokens,
      });
    }

@ -90,31 +87,21 @@ const spendStructuredTokens = async (txData, tokenUsage) => {
  let prompt, completion;
  try {
    if (promptTokens) {
-      const input = Math.max(promptTokens.input ?? 0, 0);
-      const write = Math.max(promptTokens.write ?? 0, 0);
-      const read = Math.max(promptTokens.read ?? 0, 0);
-      const totalInputTokens = input + write + read;
+      const { input = 0, write = 0, read = 0 } = promptTokens;
      prompt = await createStructuredTransaction({
        ...txData,
        tokenType: 'prompt',
        inputTokens: -input,
        writeTokens: -write,
        readTokens: -read,
-        inputTokenCount: totalInputTokens,
      });
    }

    if (completionTokens) {
-      const totalInputTokens = promptTokens
-        ? Math.max(promptTokens.input ?? 0, 0) +
-          Math.max(promptTokens.write ?? 0, 0) +
-          Math.max(promptTokens.read ?? 0, 0)
-        : undefined;
      completion = await createTransaction({
        ...txData,
        tokenType: 'completion',
-        rawAmount: -Math.max(completionTokens, 0),
-        inputTokenCount: totalInputTokens,
+        rawAmount: -completionTokens,
      });
    }

--- a/api/models/spendTokens.spec.js
+++ b/api/models/spendTokens.spec.js
@ -1,8 +1,7 @@
 const mongoose = require('mongoose');
 const { MongoMemoryServer } = require('mongodb-memory-server');
-const { createTransaction, createAutoRefillTransaction } = require('./Transaction');
-const { tokenValues, premiumTokenValues, getCacheMultiplier } = require('./tx');
 const { spendTokens, spendStructuredTokens } = require('./spendTokens');
+const { createTransaction, createAutoRefillTransaction } = require('./Transaction');

 require('~/db/models');

@ -735,457 +734,4 @@ describe('spendTokens', () => {
    expect(balance).toBeDefined();
    expect(balance.tokenCredits).toBeLessThan(10000); // Balance should be reduced
  });
-
-  describe('premium token pricing', () => {
-    it('should charge standard rates for claude-opus-4-6 when prompt tokens are below threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const promptTokens = 100000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-standard-pricing',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * tokenValues[model].prompt + completionTokens * tokenValues[model].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-
-    it('should charge premium rates for claude-opus-4-6 when prompt tokens exceed threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const promptTokens = 250000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-premium-pricing',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * premiumTokenValues[model].prompt +
-        completionTokens * premiumTokenValues[model].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-
-    it('should charge premium rates for both prompt and completion in structured tokens when above threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const txData = {
-        user: userId,
-        conversationId: 'test-structured-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      const tokenUsage = {
-        promptTokens: {
-          input: 200000,
-          write: 10000,
-          read: 5000,
-        },
-        completionTokens: 1000,
-      };
-
-      const result = await spendStructuredTokens(txData, tokenUsage);
-
-      const premiumPromptRate = premiumTokenValues[model].prompt;
-      const premiumCompletionRate = premiumTokenValues[model].completion;
-      const writeRate = getCacheMultiplier({ model, cacheType: 'write' });
-      const readRate = getCacheMultiplier({ model, cacheType: 'read' });
-
-      const expectedPromptCost =
-        tokenUsage.promptTokens.input * premiumPromptRate +
-        tokenUsage.promptTokens.write * writeRate +
-        tokenUsage.promptTokens.read * readRate;
-      const expectedCompletionCost = tokenUsage.completionTokens * premiumCompletionRate;
-
-      expect(result.prompt.prompt).toBeCloseTo(-expectedPromptCost, 0);
-      expect(result.completion.completion).toBeCloseTo(-expectedCompletionCost, 0);
-    });
-
-    it('should charge standard rates for structured tokens when below threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const txData = {
-        user: userId,
-        conversationId: 'test-structured-standard',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      const tokenUsage = {
-        promptTokens: {
-          input: 50000,
-          write: 10000,
-          read: 5000,
-        },
-        completionTokens: 1000,
-      };
-
-      const result = await spendStructuredTokens(txData, tokenUsage);
-
-      const standardPromptRate = tokenValues[model].prompt;
-      const standardCompletionRate = tokenValues[model].completion;
-      const writeRate = getCacheMultiplier({ model, cacheType: 'write' });
-      const readRate = getCacheMultiplier({ model, cacheType: 'read' });
-
-      const expectedPromptCost =
-        tokenUsage.promptTokens.input * standardPromptRate +
-        tokenUsage.promptTokens.write * writeRate +
-        tokenUsage.promptTokens.read * readRate;
-      const expectedCompletionCost = tokenUsage.completionTokens * standardCompletionRate;
-
-      expect(result.prompt.prompt).toBeCloseTo(-expectedPromptCost, 0);
-      expect(result.completion.completion).toBeCloseTo(-expectedCompletionCost, 0);
-    });
-
-    it('should charge standard rates for gemini-3.1-pro-preview when prompt tokens are below threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'gemini-3.1-pro-preview';
-      const promptTokens = 100000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-gemini31-standard-pricing',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * tokenValues['gemini-3.1'].prompt +
-        completionTokens * tokenValues['gemini-3.1'].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-
-    it('should charge premium rates for gemini-3.1-pro-preview when prompt tokens exceed threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'gemini-3.1-pro-preview';
-      const promptTokens = 250000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-gemini31-premium-pricing',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * premiumTokenValues['gemini-3.1'].prompt +
-        completionTokens * premiumTokenValues['gemini-3.1'].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-
-    it('should charge premium rates for gemini-3.1-pro-preview-customtools when prompt tokens exceed threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'gemini-3.1-pro-preview-customtools';
-      const promptTokens = 250000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-gemini31-customtools-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * premiumTokenValues['gemini-3.1'].prompt +
-        completionTokens * premiumTokenValues['gemini-3.1'].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-
-    it('should charge premium rates for structured gemini-3.1 tokens when total input exceeds threshold', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'gemini-3.1-pro-preview';
-      const txData = {
-        user: userId,
-        conversationId: 'test-gemini31-structured-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      const tokenUsage = {
-        promptTokens: {
-          input: 200000,
-          write: 10000,
-          read: 5000,
-        },
-        completionTokens: 1000,
-      };
-
-      const result = await spendStructuredTokens(txData, tokenUsage);
-
-      const premiumPromptRate = premiumTokenValues['gemini-3.1'].prompt;
-      const premiumCompletionRate = premiumTokenValues['gemini-3.1'].completion;
-      const writeRate = getCacheMultiplier({ model, cacheType: 'write' });
-      const readRate = getCacheMultiplier({ model, cacheType: 'read' });
-
-      const expectedPromptCost =
-        tokenUsage.promptTokens.input * premiumPromptRate +
-        tokenUsage.promptTokens.write * writeRate +
-        tokenUsage.promptTokens.read * readRate;
-      const expectedCompletionCost = tokenUsage.completionTokens * premiumCompletionRate;
-
-      expect(result.prompt.prompt).toBeCloseTo(-expectedPromptCost, 0);
-      expect(result.completion.completion).toBeCloseTo(-expectedCompletionCost, 0);
-    });
-
-    it('should not apply premium pricing to non-premium models regardless of prompt size', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-5';
-      const promptTokens = 300000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-no-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const expectedCost =
-        promptTokens * tokenValues[model].prompt + completionTokens * tokenValues[model].completion;
-
-      const balance = await Balance.findOne({ user: userId });
-      expect(balance.tokenCredits).toBeCloseTo(initialBalance - expectedCost, 0);
-    });
-  });
-
-  describe('inputTokenCount Normalization', () => {
-    it('should normalize negative promptTokens to zero for inputTokenCount', async () => {
-      await Balance.create({
-        user: userId,
-        tokenCredits: 100000000,
-      });
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-negative-prompt',
-        model: 'claude-opus-4-6',
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens: -500, completionTokens: 100 });
-
-      const transactions = await Transaction.find({ user: userId }).sort({ tokenType: 1 });
-
-      const completionTx = transactions.find((t) => t.tokenType === 'completion');
-      const promptTx = transactions.find((t) => t.tokenType === 'prompt');
-
-      expect(Math.abs(promptTx.rawAmount)).toBe(0);
-      expect(completionTx.rawAmount).toBe(-100);
-
-      const standardCompletionRate = tokenValues['claude-opus-4-6'].completion;
-      expect(completionTx.rate).toBe(standardCompletionRate);
-    });
-
-    it('should use normalized inputTokenCount for premium threshold check on completion', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const promptTokens = 250000;
-      const completionTokens = 500;
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-normalized-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens, completionTokens });
-
-      const transactions = await Transaction.find({ user: userId }).sort({ tokenType: 1 });
-      const completionTx = transactions.find((t) => t.tokenType === 'completion');
-      const promptTx = transactions.find((t) => t.tokenType === 'prompt');
-
-      const premiumPromptRate = premiumTokenValues[model].prompt;
-      const premiumCompletionRate = premiumTokenValues[model].completion;
-      expect(promptTx.rate).toBe(premiumPromptRate);
-      expect(completionTx.rate).toBe(premiumCompletionRate);
-    });
-
-    it('should keep inputTokenCount as zero when promptTokens is zero', async () => {
-      await Balance.create({
-        user: userId,
-        tokenCredits: 100000000,
-      });
-
-      const txData = {
-        user: userId,
-        conversationId: 'test-zero-prompt',
-        model: 'claude-opus-4-6',
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens: 0, completionTokens: 100 });
-
-      const transactions = await Transaction.find({ user: userId }).sort({ tokenType: 1 });
-      const completionTx = transactions.find((t) => t.tokenType === 'completion');
-      const promptTx = transactions.find((t) => t.tokenType === 'prompt');
-
-      expect(Math.abs(promptTx.rawAmount)).toBe(0);
-
-      const standardCompletionRate = tokenValues['claude-opus-4-6'].completion;
-      expect(completionTx.rate).toBe(standardCompletionRate);
-    });
-
-    it('should not trigger premium pricing with negative promptTokens on premium model', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const txData = {
-        user: userId,
-        conversationId: 'test-negative-no-premium',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      await spendTokens(txData, { promptTokens: -300000, completionTokens: 500 });
-
-      const transactions = await Transaction.find({ user: userId }).sort({ tokenType: 1 });
-      const completionTx = transactions.find((t) => t.tokenType === 'completion');
-
-      const standardCompletionRate = tokenValues[model].completion;
-      expect(completionTx.rate).toBe(standardCompletionRate);
-    });
-
-    it('should normalize negative structured token values to zero in spendStructuredTokens', async () => {
-      const initialBalance = 100000000;
-      await Balance.create({
-        user: userId,
-        tokenCredits: initialBalance,
-      });
-
-      const model = 'claude-opus-4-6';
-      const txData = {
-        user: userId,
-        conversationId: 'test-negative-structured',
-        model,
-        context: 'test',
-        balance: { enabled: true },
-      };
-
-      const tokenUsage = {
-        promptTokens: { input: -100, write: 50, read: -30 },
-        completionTokens: -200,
-      };
-
-      await spendStructuredTokens(txData, tokenUsage);
-
-      const transactions = await Transaction.find({
-        user: userId,
-        conversationId: 'test-negative-structured',
-      }).sort({ tokenType: 1 });
-
-      const completionTx = transactions.find((t) => t.tokenType === 'completion');
-      const promptTx = transactions.find((t) => t.tokenType === 'prompt');
-
-      expect(Math.abs(promptTx.inputTokens)).toBe(0);
-      expect(promptTx.writeTokens).toBe(-50);
-      expect(Math.abs(promptTx.readTokens)).toBe(0);
-
-      expect(Math.abs(completionTx.rawAmount)).toBe(0);
-
-      const standardRate = tokenValues[model].completion;
-      expect(completionTx.rate).toBe(standardRate);
-    });
-  });
 });
--- a/api/models/tx.js
+++ b/api/models/tx.js
@ -1,27 +1,10 @@
 const { matchModelName, findMatchingPattern } = require('@librechat/api');
 const defaultRate = 6;

-/**
- * Token Pricing Configuration
- *
- * Pattern Matching
- * ================
- * `findMatchingPattern` (from @librechat/api) uses `modelName.includes(key)` and selects
- * the LONGEST matching key. If a key's length equals the model name's length (exact match),
- * it returns immediately. Definition order does NOT affect correctness.
- *
- * Key ordering matters only for:
- *   1. Performance: list older/less common models first so newer/common models
- *      are found earlier in the reverse scan.
- *   2. Same-length tie-breaking: the last-defined key wins on equal-length matches.
- *
- * This applies to BOTH `tokenValues` and `cacheTokenValues` objects.
- */
-
 /**
 * AWS Bedrock pricing
 * source: https://aws.amazon.com/bedrock/pricing/
- */
+ * */
 const bedrockValues = {
  // Basic llama2 patterns (base defaults to smallest variant)
  llama2: { prompt: 0.75, completion: 1.0 },
@ -97,11 +80,6 @@ const bedrockValues = {
  'nova-pro': { prompt: 0.8, completion: 3.2 },
  'nova-premier': { prompt: 2.5, completion: 12.5 },
  'deepseek.r1': { prompt: 1.35, completion: 5.4 },
-  // Moonshot/Kimi models on Bedrock
-  'moonshot.kimi': { prompt: 0.6, completion: 2.5 },
-  'moonshot.kimi-k2': { prompt: 0.6, completion: 2.5 },
-  'moonshot.kimi-k2.5': { prompt: 0.6, completion: 3.0 },
-  'moonshot.kimi-k2-thinking': { prompt: 0.6, completion: 2.5 },
 };

 /**
@ -137,14 +115,9 @@ const tokenValues = Object.assign(
    'gpt-5': { prompt: 1.25, completion: 10 },
    'gpt-5.1': { prompt: 1.25, completion: 10 },
    'gpt-5.2': { prompt: 1.75, completion: 14 },
-    'gpt-5.3': { prompt: 1.75, completion: 14 },
-    'gpt-5.4': { prompt: 2.5, completion: 15 },
-    // TODO: gpt-5.4-pro pricing not yet officially published — verify before release
-    'gpt-5.4-pro': { prompt: 5, completion: 30 },
    'gpt-5-nano': { prompt: 0.05, completion: 0.4 },
    'gpt-5-mini': { prompt: 0.25, completion: 2 },
    'gpt-5-pro': { prompt: 15, completion: 120 },
-    'gpt-5.2-pro': { prompt: 21, completion: 168 },
    o1: { prompt: 15, completion: 60 },
    'o1-mini': { prompt: 1.1, completion: 4.4 },
    'o1-preview': { prompt: 15, completion: 60 },
@ -166,9 +139,7 @@ const tokenValues = Object.assign(
    'claude-haiku-4-5': { prompt: 1, completion: 5 },
    'claude-opus-4': { prompt: 15, completion: 75 },
    'claude-opus-4-5': { prompt: 5, completion: 25 },
-    'claude-opus-4-6': { prompt: 5, completion: 25 },
    'claude-sonnet-4': { prompt: 3, completion: 15 },
-    'claude-sonnet-4-6': { prompt: 3, completion: 15 },
    'command-r': { prompt: 0.5, completion: 1.5 },
    'command-r-plus': { prompt: 3, completion: 15 },
    'command-text': { prompt: 1.5, completion: 2.0 },
@ -192,8 +163,6 @@ const tokenValues = Object.assign(
    'gemini-2.5-flash-image': { prompt: 0.15, completion: 30 },
    'gemini-3': { prompt: 2, completion: 12 },
    'gemini-3-pro-image': { prompt: 2, completion: 120 },
-    'gemini-3.1': { prompt: 2, completion: 12 },
-    'gemini-3.1-flash-lite': { prompt: 0.25, completion: 1.5 },
    'gemini-pro-vision': { prompt: 0.5, completion: 1.5 },
    grok: { prompt: 2.0, completion: 10.0 }, // Base pattern defaults to grok-2
    'grok-beta': { prompt: 5.0, completion: 15.0 },
@ -220,31 +189,7 @@ const tokenValues = Object.assign(
    'pixtral-large': { prompt: 2.0, completion: 6.0 },
    'mistral-large': { prompt: 2.0, completion: 6.0 },
    'mixtral-8x22b': { prompt: 0.65, completion: 0.65 },
-    // Moonshot/Kimi models (base patterns first, specific patterns last for correct matching)
-    kimi: { prompt: 0.6, completion: 2.5 }, // Base pattern
-    moonshot: { prompt: 2.0, completion: 5.0 }, // Base pattern (using 128k pricing)
-    'kimi-latest': { prompt: 0.2, completion: 2.0 }, // Uses 8k/32k/128k pricing dynamically
-    'kimi-k2': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2.5': { prompt: 0.6, completion: 3.0 },
-    'kimi-k2-turbo': { prompt: 1.15, completion: 8.0 },
-    'kimi-k2-turbo-preview': { prompt: 1.15, completion: 8.0 },
-    'kimi-k2-0905': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2-0905-preview': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2-0711': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2-0711-preview': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2-thinking': { prompt: 0.6, completion: 2.5 },
-    'kimi-k2-thinking-turbo': { prompt: 1.15, completion: 8.0 },
-    'moonshot-v1': { prompt: 2.0, completion: 5.0 },
-    'moonshot-v1-auto': { prompt: 2.0, completion: 5.0 },
-    'moonshot-v1-8k': { prompt: 0.2, completion: 2.0 },
-    'moonshot-v1-8k-vision': { prompt: 0.2, completion: 2.0 },
-    'moonshot-v1-8k-vision-preview': { prompt: 0.2, completion: 2.0 },
-    'moonshot-v1-32k': { prompt: 1.0, completion: 3.0 },
-    'moonshot-v1-32k-vision': { prompt: 1.0, completion: 3.0 },
-    'moonshot-v1-32k-vision-preview': { prompt: 1.0, completion: 3.0 },
-    'moonshot-v1-128k': { prompt: 2.0, completion: 5.0 },
-    'moonshot-v1-128k-vision': { prompt: 2.0, completion: 5.0 },
-    'moonshot-v1-128k-vision-preview': { prompt: 2.0, completion: 5.0 },
+    kimi: { prompt: 0.14, completion: 2.49 }, // Base pattern (using kimi-k2 pricing)
    // GPT-OSS models (specific sizes)
    'gpt-oss:20b': { prompt: 0.05, completion: 0.2 },
    'gpt-oss-20b': { prompt: 0.05, completion: 0.2 },
@ -304,64 +249,12 @@ const cacheTokenValues = {
  'claude-3-haiku': { write: 0.3, read: 0.03 },
  'claude-haiku-4-5': { write: 1.25, read: 0.1 },
  'claude-sonnet-4': { write: 3.75, read: 0.3 },
-  'claude-sonnet-4-6': { write: 3.75, read: 0.3 },
  'claude-opus-4': { write: 18.75, read: 1.5 },
  'claude-opus-4-5': { write: 6.25, read: 0.5 },
-  'claude-opus-4-6': { write: 6.25, read: 0.5 },
-  // OpenAI models — cached input discount varies by family:
-  //   gpt-4o (incl. mini), o1 (incl. mini/preview): 50% off
-  //   gpt-4.1 (incl. mini/nano), o3 (incl. mini), o4-mini: 75% off
-  //   gpt-5.x (excl. pro variants): 90% off
-  //   gpt-5-pro, gpt-5.2-pro, gpt-5.4-pro: no caching
-  'gpt-4o': { write: 2.5, read: 1.25 },
-  'gpt-4o-mini': { write: 0.15, read: 0.075 },
-  'gpt-4.1': { write: 2, read: 0.5 },
-  'gpt-4.1-mini': { write: 0.4, read: 0.1 },
-  'gpt-4.1-nano': { write: 0.1, read: 0.025 },
-  'gpt-5': { write: 1.25, read: 0.125 },
-  'gpt-5.1': { write: 1.25, read: 0.125 },
-  'gpt-5.2': { write: 1.75, read: 0.175 },
-  'gpt-5.3': { write: 1.75, read: 0.175 },
-  'gpt-5.4': { write: 2.5, read: 0.25 },
-  'gpt-5-mini': { write: 0.25, read: 0.025 },
-  'gpt-5-nano': { write: 0.05, read: 0.005 },
-  o1: { write: 15, read: 7.5 },
-  'o1-mini': { write: 1.1, read: 0.55 },
-  'o1-preview': { write: 15, read: 7.5 },
-  o3: { write: 2, read: 0.5 },
-  'o3-mini': { write: 1.1, read: 0.275 },
-  'o4-mini': { write: 1.1, read: 0.275 },
  // DeepSeek models - cache hit: $0.028/1M, cache miss: $0.28/1M
  deepseek: { write: 0.28, read: 0.028 },
  'deepseek-chat': { write: 0.28, read: 0.028 },
  'deepseek-reasoner': { write: 0.28, read: 0.028 },
-  // Moonshot/Kimi models - cache hit: $0.15/1M (k2) or $0.10/1M (k2.5), cache miss: $0.60/1M
-  kimi: { write: 0.6, read: 0.15 },
-  'kimi-k2': { write: 0.6, read: 0.15 },
-  'kimi-k2.5': { write: 0.6, read: 0.1 },
-  'kimi-k2-turbo': { write: 1.15, read: 0.15 },
-  'kimi-k2-turbo-preview': { write: 1.15, read: 0.15 },
-  'kimi-k2-0905': { write: 0.6, read: 0.15 },
-  'kimi-k2-0905-preview': { write: 0.6, read: 0.15 },
-  'kimi-k2-0711': { write: 0.6, read: 0.15 },
-  'kimi-k2-0711-preview': { write: 0.6, read: 0.15 },
-  'kimi-k2-thinking': { write: 0.6, read: 0.15 },
-  'kimi-k2-thinking-turbo': { write: 1.15, read: 0.15 },
-  // Gemini 3.1 Pro - cache write: $2.00/1M, cache read: $0.20/1M
-  'gemini-3.1': { write: 2, read: 0.2 },
-  // Gemini 3.1 Flash-Lite - cache write: $0.25/1M, cache read: $0.025/1M
-  'gemini-3.1-flash-lite': { write: 0.25, read: 0.025 },
-};
-
-/**
- * Premium (tiered) pricing for models whose rates change based on prompt size.
- * Each entry specifies the token threshold and the rates that apply above it.
- * @type {Object.<string, {threshold: number, prompt: number, completion: number}>}
- */
-const premiumTokenValues = {
-  'claude-opus-4-6': { threshold: 200000, prompt: 10, completion: 37.5 },
-  'claude-sonnet-4-6': { threshold: 200000, prompt: 6, completion: 22.5 },
-  'gemini-3.1': { threshold: 200000, prompt: 4, completion: 18 },
 };

 /**
@ -420,27 +313,15 @@ const getValueKey = (model, endpoint) => {
 * @param {string} [params.model] - The model name to derive the value key from if not provided.
 * @param {string} [params.endpoint] - The endpoint name to derive the value key from if not provided.
 * @param {EndpointTokenConfig} [params.endpointTokenConfig] - The token configuration for the endpoint.
- * @param {number} [params.inputTokenCount] - Total input token count for tiered pricing.
 * @returns {number} The multiplier for the given parameters, or a default value if not found.
 */
-const getMultiplier = ({
-  model,
-  valueKey,
-  endpoint,
-  tokenType,
-  inputTokenCount,
-  endpointTokenConfig,
-}) => {
+const getMultiplier = ({ valueKey, tokenType, model, endpoint, endpointTokenConfig }) => {
  if (endpointTokenConfig) {
    return endpointTokenConfig?.[model]?.[tokenType] ?? defaultRate;
  }

  if (valueKey && tokenType) {
-    const premiumRate = getPremiumRate(valueKey, tokenType, inputTokenCount);
-    if (premiumRate != null) {
-      return premiumRate;
-    }
-    return tokenValues[valueKey]?.[tokenType] ?? defaultRate;
+    return tokenValues[valueKey][tokenType] ?? defaultRate;
  }

  if (!tokenType || !model) {
@ -452,33 +333,10 @@ const getMultiplier = ({
    return defaultRate;
  }

-  const premiumRate = getPremiumRate(valueKey, tokenType, inputTokenCount);
-  if (premiumRate != null) {
-    return premiumRate;
-  }
-
+  // If we got this far, and values[tokenType] is undefined somehow, return a rough average of default multipliers
  return tokenValues[valueKey]?.[tokenType] ?? defaultRate;
 };

-/**
- * Checks if premium (tiered) pricing applies and returns the premium rate.
- * Each model defines its own threshold in `premiumTokenValues`.
- * @param {string} valueKey
- * @param {string} tokenType
- * @param {number} [inputTokenCount]
- * @returns {number|null}
- */
-const getPremiumRate = (valueKey, tokenType, inputTokenCount) => {
-  if (inputTokenCount == null) {
-    return null;
-  }
-  const premiumEntry = premiumTokenValues[valueKey];
-  if (!premiumEntry || inputTokenCount <= premiumEntry.threshold) {
-    return null;
-  }
-  return premiumEntry[tokenType] ?? null;
-};
-
 /**
 * Retrieves the cache multiplier for a given value key and token type. If no value key is provided,
 * it attempts to derive it from the model name.
@ -515,10 +373,8 @@ const getCacheMultiplier = ({ valueKey, cacheType, model, endpoint, endpointToke

 module.exports = {
  tokenValues,
-  premiumTokenValues,
  getValueKey,
  getMultiplier,
-  getPremiumRate,
  getCacheMultiplier,
  defaultRate,
  cacheTokenValues,
--- a/api/models/tx.spec.js
+++ b/api/models/tx.spec.js
@ -1,4 +1,3 @@
-/** Note: No hard-coded values should be used in this file. */
 const { maxTokensMap } = require('@librechat/api');
 const { EModelEndpoint } = require('librechat-data-provider');
 const {
@ -6,10 +5,8 @@ const {
  tokenValues,
  getValueKey,
  getMultiplier,
-  getPremiumRate,
  cacheTokenValues,
  getCacheMultiplier,
-  premiumTokenValues,
 } = require('./tx');

 describe('getValueKey', () => {
@ -52,24 +49,6 @@ describe('getValueKey', () => {
    expect(getValueKey('openai/gpt-5.2')).toBe('gpt-5.2');
  });

-  it('should return "gpt-5.3" for model name containing "gpt-5.3"', () => {
-    expect(getValueKey('gpt-5.3')).toBe('gpt-5.3');
-    expect(getValueKey('gpt-5.3-chat-latest')).toBe('gpt-5.3');
-    expect(getValueKey('gpt-5.3-codex')).toBe('gpt-5.3');
-    expect(getValueKey('openai/gpt-5.3')).toBe('gpt-5.3');
-  });
-
-  it('should return "gpt-5.4" for model name containing "gpt-5.4"', () => {
-    expect(getValueKey('gpt-5.4')).toBe('gpt-5.4');
-    expect(getValueKey('gpt-5.4-thinking')).toBe('gpt-5.4');
-    expect(getValueKey('openai/gpt-5.4')).toBe('gpt-5.4');
-  });
-
-  it('should return "gpt-5.4-pro" for model name containing "gpt-5.4-pro"', () => {
-    expect(getValueKey('gpt-5.4-pro')).toBe('gpt-5.4-pro');
-    expect(getValueKey('openai/gpt-5.4-pro')).toBe('gpt-5.4-pro');
-  });
-
  it('should return "gpt-3.5-turbo-1106" for model name containing "gpt-3.5-turbo-1106"', () => {
    expect(getValueKey('gpt-3.5-turbo-1106-some-other-info')).toBe('gpt-3.5-turbo-1106');
    expect(getValueKey('openai/gpt-3.5-turbo-1106')).toBe('gpt-3.5-turbo-1106');
@ -156,12 +135,6 @@ describe('getValueKey', () => {
    expect(getValueKey('gpt-5-pro-preview')).toBe('gpt-5-pro');
  });

-  it('should return "gpt-5.2-pro" for model name containing "gpt-5.2-pro"', () => {
-    expect(getValueKey('gpt-5.2-pro')).toBe('gpt-5.2-pro');
-    expect(getValueKey('gpt-5.2-pro-2025-03-01')).toBe('gpt-5.2-pro');
-    expect(getValueKey('openai/gpt-5.2-pro')).toBe('gpt-5.2-pro');
-  });
-
  it('should return "gpt-4o" for model type of "gpt-4o"', () => {
    expect(getValueKey('gpt-4o-2024-08-06')).toBe('gpt-4o');
    expect(getValueKey('gpt-4o-2024-08-06-0718')).toBe('gpt-4o');
@ -266,15 +239,6 @@ describe('getMultiplier', () => {
    expect(getMultiplier({ valueKey: '8k', tokenType: 'unknownType' })).toBe(defaultRate);
  });

-  it('should return defaultRate if valueKey does not exist in tokenValues', () => {
-    expect(getMultiplier({ valueKey: 'non-existent-model', tokenType: 'prompt' })).toBe(
-      defaultRate,
-    );
-    expect(getMultiplier({ valueKey: 'non-existent-model', tokenType: 'completion' })).toBe(
-      defaultRate,
-    );
-  });
-
  it('should derive the valueKey from the model if not provided', () => {
    expect(getMultiplier({ tokenType: 'prompt', model: 'gpt-4-some-other-info' })).toBe(
      tokenValues['8k'].prompt,
@ -360,18 +324,6 @@ describe('getMultiplier', () => {
    );
  });

-  it('should return the correct multiplier for gpt-5.2-pro', () => {
-    expect(getMultiplier({ model: 'gpt-5.2-pro', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.2-pro'].prompt,
-    );
-    expect(getMultiplier({ model: 'gpt-5.2-pro', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.2-pro'].completion,
-    );
-    expect(getMultiplier({ model: 'openai/gpt-5.2-pro', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.2-pro'].prompt,
-    );
-  });
-
  it('should return the correct multiplier for gpt-5.1', () => {
    expect(getMultiplier({ model: 'gpt-5.1', tokenType: 'prompt' })).toBe(
      tokenValues['gpt-5.1'].prompt,
@ -382,6 +334,8 @@ describe('getMultiplier', () => {
    expect(getMultiplier({ model: 'openai/gpt-5.1', tokenType: 'prompt' })).toBe(
      tokenValues['gpt-5.1'].prompt,
    );
+    expect(tokenValues['gpt-5.1'].prompt).toBe(1.25);
+    expect(tokenValues['gpt-5.1'].completion).toBe(10);
  });

  it('should return the correct multiplier for gpt-5.2', () => {
@ -394,48 +348,8 @@ describe('getMultiplier', () => {
    expect(getMultiplier({ model: 'openai/gpt-5.2', tokenType: 'prompt' })).toBe(
      tokenValues['gpt-5.2'].prompt,
    );
-  });
-
-  it('should return the correct multiplier for gpt-5.3', () => {
-    expect(getMultiplier({ model: 'gpt-5.3', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.3'].prompt,
-    );
-    expect(getMultiplier({ model: 'gpt-5.3', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.3'].completion,
-    );
-    expect(getMultiplier({ model: 'gpt-5.3-codex', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.3'].prompt,
-    );
-    expect(getMultiplier({ model: 'openai/gpt-5.3', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.3'].completion,
-    );
-  });
-
-  it('should return the correct multiplier for gpt-5.4', () => {
-    expect(getMultiplier({ model: 'gpt-5.4', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.4'].prompt,
-    );
-    expect(getMultiplier({ model: 'gpt-5.4', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.4'].completion,
-    );
-    expect(getMultiplier({ model: 'gpt-5.4-thinking', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.4'].prompt,
-    );
-    expect(getMultiplier({ model: 'openai/gpt-5.4', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.4'].completion,
-    );
-  });
-
-  it('should return the correct multiplier for gpt-5.4-pro', () => {
-    expect(getMultiplier({ model: 'gpt-5.4-pro', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.4-pro'].prompt,
-    );
-    expect(getMultiplier({ model: 'gpt-5.4-pro', tokenType: 'completion' })).toBe(
-      tokenValues['gpt-5.4-pro'].completion,
-    );
-    expect(getMultiplier({ model: 'openai/gpt-5.4-pro', tokenType: 'prompt' })).toBe(
-      tokenValues['gpt-5.4-pro'].prompt,
-    );
+    expect(tokenValues['gpt-5.2'].prompt).toBe(1.75);
+    expect(tokenValues['gpt-5.2'].completion).toBe(14);
  });

  it('should return the correct multiplier for gpt-4o', () => {
@ -901,6 +815,8 @@ describe('Deepseek Model Tests', () => {
    expect(getMultiplier({ model: 'deepseek-chat', tokenType: 'completion' })).toBe(
      tokenValues['deepseek-chat'].completion,
    );
+    expect(tokenValues['deepseek-chat'].prompt).toBe(0.28);
+    expect(tokenValues['deepseek-chat'].completion).toBe(0.42);
  });

  it('should return correct pricing for deepseek-reasoner', () => {
@ -910,6 +826,8 @@ describe('Deepseek Model Tests', () => {
    expect(getMultiplier({ model: 'deepseek-reasoner', tokenType: 'completion' })).toBe(
      tokenValues['deepseek-reasoner'].completion,
    );
+    expect(tokenValues['deepseek-reasoner'].prompt).toBe(0.28);
+    expect(tokenValues['deepseek-reasoner'].completion).toBe(0.42);
  });

  it('should handle DeepSeek model name variations with provider prefixes', () => {
@ -922,8 +840,8 @@ describe('Deepseek Model Tests', () => {
    modelVariations.forEach((model) => {
      const promptMultiplier = getMultiplier({ model, tokenType: 'prompt' });
      const completionMultiplier = getMultiplier({ model, tokenType: 'completion' });
-      expect(promptMultiplier).toBe(tokenValues['deepseek-chat'].prompt);
-      expect(completionMultiplier).toBe(tokenValues['deepseek-chat'].completion);
+      expect(promptMultiplier).toBe(0.28);
+      expect(completionMultiplier).toBe(0.42);
    });
  });

@ -942,13 +860,13 @@ describe('Deepseek Model Tests', () => {
    );
  });

-  it('should have consistent cache pricing across DeepSeek model variants', () => {
-    expect(cacheTokenValues['deepseek'].write).toBe(cacheTokenValues['deepseek-chat'].write);
-    expect(cacheTokenValues['deepseek'].read).toBe(cacheTokenValues['deepseek-chat'].read);
-    expect(cacheTokenValues['deepseek-reasoner'].write).toBe(
-      cacheTokenValues['deepseek-chat'].write,
-    );
-    expect(cacheTokenValues['deepseek-reasoner'].read).toBe(cacheTokenValues['deepseek-chat'].read);
+  it('should return correct cache pricing values for DeepSeek models', () => {
+    expect(cacheTokenValues['deepseek-chat'].write).toBe(0.28);
+    expect(cacheTokenValues['deepseek-chat'].read).toBe(0.028);
+    expect(cacheTokenValues['deepseek-reasoner'].write).toBe(0.28);
+    expect(cacheTokenValues['deepseek-reasoner'].read).toBe(0.028);
+    expect(cacheTokenValues['deepseek'].write).toBe(0.28);
+    expect(cacheTokenValues['deepseek'].read).toBe(0.028);
  });

  it('should handle DeepSeek cache multipliers with model variations', () => {
@ -957,195 +875,8 @@ describe('Deepseek Model Tests', () => {
    modelVariations.forEach((model) => {
      const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' });
      const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' });
-      expect(writeMultiplier).toBe(cacheTokenValues['deepseek-chat'].write);
-      expect(readMultiplier).toBe(cacheTokenValues['deepseek-chat'].read);
-    });
-  });
-});
-
-describe('Moonshot/Kimi Model Tests - Pricing', () => {
-  describe('Kimi Models', () => {
-    it('should return correct pricing for kimi base pattern', () => {
-      expect(getMultiplier({ model: 'kimi', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi', tokenType: 'completion' })).toBe(
-        tokenValues['kimi'].completion,
-      );
-    });
-
-    it('should return correct pricing for kimi-k2.5', () => {
-      expect(getMultiplier({ model: 'kimi-k2.5', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi-k2.5'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi-k2.5', tokenType: 'completion' })).toBe(
-        tokenValues['kimi-k2.5'].completion,
-      );
-    });
-
-    it('should return correct pricing for kimi-k2 series', () => {
-      expect(getMultiplier({ model: 'kimi-k2', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi-k2'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi-k2', tokenType: 'completion' })).toBe(
-        tokenValues['kimi-k2'].completion,
-      );
-    });
-
-    it('should return correct pricing for kimi-k2-turbo (higher pricing)', () => {
-      expect(getMultiplier({ model: 'kimi-k2-turbo', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi-k2-turbo'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi-k2-turbo', tokenType: 'completion' })).toBe(
-        tokenValues['kimi-k2-turbo'].completion,
-      );
-    });
-
-    it('should return correct pricing for kimi-k2-thinking models', () => {
-      expect(getMultiplier({ model: 'kimi-k2-thinking', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi-k2-thinking'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi-k2-thinking', tokenType: 'completion' })).toBe(
-        tokenValues['kimi-k2-thinking'].completion,
-      );
-      expect(getMultiplier({ model: 'kimi-k2-thinking-turbo', tokenType: 'prompt' })).toBe(
-        tokenValues['kimi-k2-thinking-turbo'].prompt,
-      );
-      expect(getMultiplier({ model: 'kimi-k2-thinking-turbo', tokenType: 'completion' })).toBe(
-        tokenValues['kimi-k2-thinking-turbo'].completion,
-      );
-    });
-
-    it('should handle Kimi model variations with provider prefixes', () => {
-      const modelVariations = ['openrouter/kimi-k2', 'openrouter/kimi-k2.5', 'openrouter/kimi'];
-
-      modelVariations.forEach((model) => {
-        const promptMultiplier = getMultiplier({ model, tokenType: 'prompt' });
-        const completionMultiplier = getMultiplier({ model, tokenType: 'completion' });
-        expect(promptMultiplier).toBe(tokenValues['kimi'].prompt);
-        expect([tokenValues['kimi'].completion, tokenValues['kimi-k2.5'].completion]).toContain(
-          completionMultiplier,
-        );
-      });
-    });
-  });
-
-  describe('Moonshot Models', () => {
-    it('should return correct pricing for moonshot base pattern (128k pricing)', () => {
-      expect(getMultiplier({ model: 'moonshot', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot'].completion,
-      );
-    });
-
-    it('should return correct pricing for moonshot-v1-8k', () => {
-      expect(getMultiplier({ model: 'moonshot-v1-8k', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-8k'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-8k', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-8k'].completion,
-      );
-    });
-
-    it('should return correct pricing for moonshot-v1-32k', () => {
-      expect(getMultiplier({ model: 'moonshot-v1-32k', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-32k'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-32k', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-32k'].completion,
-      );
-    });
-
-    it('should return correct pricing for moonshot-v1-128k', () => {
-      expect(getMultiplier({ model: 'moonshot-v1-128k', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-128k'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-128k', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-128k'].completion,
-      );
-    });
-
-    it('should return correct pricing for moonshot-v1 vision models', () => {
-      expect(getMultiplier({ model: 'moonshot-v1-8k-vision', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-8k-vision'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-8k-vision', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-8k-vision'].completion,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-32k-vision', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-32k-vision'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-32k-vision', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-32k-vision'].completion,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-128k-vision', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot-v1-128k-vision'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot-v1-128k-vision', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot-v1-128k-vision'].completion,
-      );
-    });
-  });
-
-  describe('Kimi Cache Multipliers', () => {
-    it('should return correct cache multipliers for kimi-k2 models', () => {
-      expect(getCacheMultiplier({ model: 'kimi', cacheType: 'write' })).toBe(
-        cacheTokenValues['kimi'].write,
-      );
-      expect(getCacheMultiplier({ model: 'kimi', cacheType: 'read' })).toBe(
-        cacheTokenValues['kimi'].read,
-      );
-    });
-
-    it('should return correct cache multipliers for kimi-k2.5 (lower read price)', () => {
-      expect(getCacheMultiplier({ model: 'kimi-k2.5', cacheType: 'write' })).toBe(
-        cacheTokenValues['kimi-k2.5'].write,
-      );
-      expect(getCacheMultiplier({ model: 'kimi-k2.5', cacheType: 'read' })).toBe(
-        cacheTokenValues['kimi-k2.5'].read,
-      );
-    });
-
-    it('should return correct cache multipliers for kimi-k2-turbo', () => {
-      expect(getCacheMultiplier({ model: 'kimi-k2-turbo', cacheType: 'write' })).toBe(
-        cacheTokenValues['kimi-k2-turbo'].write,
-      );
-      expect(getCacheMultiplier({ model: 'kimi-k2-turbo', cacheType: 'read' })).toBe(
-        cacheTokenValues['kimi-k2-turbo'].read,
-      );
-    });
-
-    it('should handle Kimi cache multipliers with model variations', () => {
-      const modelVariations = ['openrouter/kimi-k2', 'openrouter/kimi'];
-
-      modelVariations.forEach((model) => {
-        const writeMultiplier = getCacheMultiplier({ model, cacheType: 'write' });
-        const readMultiplier = getCacheMultiplier({ model, cacheType: 'read' });
-        expect(writeMultiplier).toBe(cacheTokenValues['kimi'].write);
-        expect(readMultiplier).toBe(cacheTokenValues['kimi'].read);
-      });
-    });
-  });
-
-  describe('Bedrock Moonshot Models', () => {
-    it('should return correct pricing for Bedrock moonshot models', () => {
-      expect(getMultiplier({ model: 'moonshot.kimi', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot.kimi'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot.kimi', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot.kimi'].completion,
-      );
-      expect(getMultiplier({ model: 'moonshot.kimi-k2', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot.kimi-k2'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot.kimi-k2.5', tokenType: 'prompt' })).toBe(
-        tokenValues['moonshot.kimi-k2.5'].prompt,
-      );
-      expect(getMultiplier({ model: 'moonshot.kimi-k2.5', tokenType: 'completion' })).toBe(
-        tokenValues['moonshot.kimi-k2.5'].completion,
-      );
+      expect(writeMultiplier).toBe(0.28);
+      expect(readMultiplier).toBe(0.028);
    });
  });
 });
@ -1404,73 +1135,6 @@ describe('getCacheMultiplier', () => {
    ).toBeNull();
  });

-  it('should return correct cache multipliers for OpenAI models', () => {
-    const openaiCacheModels = [
-      'gpt-4o',
-      'gpt-4o-mini',
-      'gpt-4.1',
-      'gpt-4.1-mini',
-      'gpt-4.1-nano',
-      'gpt-5',
-      'gpt-5.1',
-      'gpt-5.2',
-      'gpt-5.3',
-      'gpt-5.4',
-      'gpt-5-mini',
-      'gpt-5-nano',
-      'o1',
-      'o1-mini',
-      'o1-preview',
-      'o3',
-      'o3-mini',
-      'o4-mini',
-    ];
-
-    for (const model of openaiCacheModels) {
-      expect(getCacheMultiplier({ model, cacheType: 'write' })).toBe(cacheTokenValues[model].write);
-      expect(getCacheMultiplier({ model, cacheType: 'read' })).toBe(cacheTokenValues[model].read);
-    }
-  });
-
-  it('should return correct cache multipliers for OpenAI dated variants', () => {
-    expect(getCacheMultiplier({ model: 'gpt-4o-2024-08-06', cacheType: 'read' })).toBe(
-      cacheTokenValues['gpt-4o'].read,
-    );
-    expect(getCacheMultiplier({ model: 'gpt-4.1-2026-01-01', cacheType: 'read' })).toBe(
-      cacheTokenValues['gpt-4.1'].read,
-    );
-    expect(getCacheMultiplier({ model: 'gpt-5.3-codex', cacheType: 'read' })).toBe(
-      cacheTokenValues['gpt-5.3'].read,
-    );
-    expect(getCacheMultiplier({ model: 'openai/gpt-5.3', cacheType: 'write' })).toBe(
-      cacheTokenValues['gpt-5.3'].write,
-    );
-  });
-
-  it('should return null for pro models that do not support caching', () => {
-    expect(getCacheMultiplier({ model: 'gpt-5-pro', cacheType: 'read' })).toBeNull();
-    expect(getCacheMultiplier({ model: 'gpt-5-pro', cacheType: 'write' })).toBeNull();
-    expect(getCacheMultiplier({ model: 'gpt-5.2-pro', cacheType: 'read' })).toBeNull();
-    expect(getCacheMultiplier({ model: 'gpt-5.2-pro', cacheType: 'write' })).toBeNull();
-    expect(getCacheMultiplier({ model: 'gpt-5.4-pro', cacheType: 'read' })).toBeNull();
-    expect(getCacheMultiplier({ model: 'gpt-5.4-pro', cacheType: 'write' })).toBeNull();
-  });
-
-  it('should have consistent 10% cache read pricing for gpt-5.x models', () => {
-    const gpt5CacheModels = [
-      'gpt-5',
-      'gpt-5.1',
-      'gpt-5.2',
-      'gpt-5.3',
-      'gpt-5.4',
-      'gpt-5-mini',
-      'gpt-5-nano',
-    ];
-    for (const model of gpt5CacheModels) {
-      expect(cacheTokenValues[model].read).toBeCloseTo(cacheTokenValues[model].write * 0.1, 10);
-    }
-  });
-
  it('should handle models with "bedrock/" prefix', () => {
    expect(
      getCacheMultiplier({
@ -1490,9 +1154,6 @@ describe('getCacheMultiplier', () => {
 describe('Google Model Tests', () => {
  const googleModels = [
    'gemini-3',
-    'gemini-3.1-pro-preview',
-    'gemini-3.1-pro-preview-customtools',
-    'gemini-3.1-flash-lite-preview',
    'gemini-2.5-pro',
    'gemini-2.5-flash',
    'gemini-2.5-flash-lite',
@ -1537,9 +1198,6 @@ describe('Google Model Tests', () => {
  it('should map to the correct model keys', () => {
    const expected = {
      'gemini-3': 'gemini-3',
-      'gemini-3.1-pro-preview': 'gemini-3.1',
-      'gemini-3.1-pro-preview-customtools': 'gemini-3.1',
-      'gemini-3.1-flash-lite-preview': 'gemini-3.1-flash-lite',
      'gemini-2.5-pro': 'gemini-2.5-pro',
      'gemini-2.5-flash': 'gemini-2.5-flash',
      'gemini-2.5-flash-lite': 'gemini-2.5-flash-lite',
@ -1583,190 +1241,6 @@ describe('Google Model Tests', () => {
      ).toBe(tokenValues[expected].completion);
    });
  });
-
-  it('should return correct prompt and completion rates for Gemini 3.1', () => {
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'prompt',
-        endpoint: EModelEndpoint.google,
-      }),
-    ).toBe(tokenValues['gemini-3.1'].prompt);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'completion',
-        endpoint: EModelEndpoint.google,
-      }),
-    ).toBe(tokenValues['gemini-3.1'].completion);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview-customtools',
-        tokenType: 'prompt',
-        endpoint: EModelEndpoint.google,
-      }),
-    ).toBe(tokenValues['gemini-3.1'].prompt);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview-customtools',
-        tokenType: 'completion',
-        endpoint: EModelEndpoint.google,
-      }),
-    ).toBe(tokenValues['gemini-3.1'].completion);
-  });
-
-  it('should return correct cache rates for Gemini 3.1', () => {
-    ['gemini-3.1-pro-preview', 'gemini-3.1-pro-preview-customtools'].forEach((model) => {
-      expect(getCacheMultiplier({ model, cacheType: 'write' })).toBe(
-        cacheTokenValues['gemini-3.1'].write,
-      );
-      expect(getCacheMultiplier({ model, cacheType: 'read' })).toBe(
-        cacheTokenValues['gemini-3.1'].read,
-      );
-    });
-  });
-
-  it('should return correct rates for Gemini 3.1 Flash-Lite', () => {
-    const model = 'gemini-3.1-flash-lite-preview';
-    expect(getMultiplier({ model, tokenType: 'prompt', endpoint: EModelEndpoint.google })).toBe(
-      tokenValues['gemini-3.1-flash-lite'].prompt,
-    );
-    expect(getMultiplier({ model, tokenType: 'completion', endpoint: EModelEndpoint.google })).toBe(
-      tokenValues['gemini-3.1-flash-lite'].completion,
-    );
-    expect(getCacheMultiplier({ model, cacheType: 'write' })).toBe(
-      cacheTokenValues['gemini-3.1-flash-lite'].write,
-    );
-    expect(getCacheMultiplier({ model, cacheType: 'read' })).toBe(
-      cacheTokenValues['gemini-3.1-flash-lite'].read,
-    );
-  });
-});
-
-describe('Gemini 3.1 Premium Token Pricing', () => {
-  const premiumKey = 'gemini-3.1';
-  const premiumEntry = premiumTokenValues[premiumKey];
-  const { threshold } = premiumEntry;
-  const belowThreshold = threshold - 1;
-  const aboveThreshold = threshold + 1;
-  const wellAboveThreshold = threshold * 2;
-
-  it('should have premium pricing defined for gemini-3.1', () => {
-    expect(premiumEntry).toBeDefined();
-    expect(premiumEntry.threshold).toBeDefined();
-    expect(premiumEntry.prompt).toBeDefined();
-    expect(premiumEntry.completion).toBeDefined();
-    expect(premiumEntry.prompt).toBeGreaterThan(tokenValues[premiumKey].prompt);
-    expect(premiumEntry.completion).toBeGreaterThan(tokenValues[premiumKey].completion);
-  });
-
-  it('should return null from getPremiumRate when inputTokenCount is below or at threshold', () => {
-    expect(getPremiumRate(premiumKey, 'prompt', belowThreshold)).toBeNull();
-    expect(getPremiumRate(premiumKey, 'completion', belowThreshold)).toBeNull();
-    expect(getPremiumRate(premiumKey, 'prompt', threshold)).toBeNull();
-  });
-
-  it('should return premium rate from getPremiumRate when inputTokenCount exceeds threshold', () => {
-    expect(getPremiumRate(premiumKey, 'prompt', aboveThreshold)).toBe(premiumEntry.prompt);
-    expect(getPremiumRate(premiumKey, 'completion', aboveThreshold)).toBe(premiumEntry.completion);
-    expect(getPremiumRate(premiumKey, 'prompt', wellAboveThreshold)).toBe(premiumEntry.prompt);
-  });
-
-  it('should return null from getPremiumRate when inputTokenCount is undefined or null', () => {
-    expect(getPremiumRate(premiumKey, 'prompt', undefined)).toBeNull();
-    expect(getPremiumRate(premiumKey, 'prompt', null)).toBeNull();
-  });
-
-  it('should return standard rate from getMultiplier when inputTokenCount is below threshold', () => {
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'prompt',
-        inputTokenCount: belowThreshold,
-      }),
-    ).toBe(tokenValues[premiumKey].prompt);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'completion',
-        inputTokenCount: belowThreshold,
-      }),
-    ).toBe(tokenValues[premiumKey].completion);
-  });
-
-  it('should return premium rate from getMultiplier when inputTokenCount exceeds threshold', () => {
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'prompt',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.prompt);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'completion',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.completion);
-  });
-
-  it('should return standard rate from getMultiplier when inputTokenCount is exactly at threshold', () => {
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview',
-        tokenType: 'prompt',
-        inputTokenCount: threshold,
-      }),
-    ).toBe(tokenValues[premiumKey].prompt);
-  });
-
-  it('should apply premium pricing to customtools variant above threshold', () => {
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview-customtools',
-        tokenType: 'prompt',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.prompt);
-    expect(
-      getMultiplier({
-        model: 'gemini-3.1-pro-preview-customtools',
-        tokenType: 'completion',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.completion);
-  });
-
-  it('should use standard rate when inputTokenCount is not provided', () => {
-    expect(getMultiplier({ model: 'gemini-3.1-pro-preview', tokenType: 'prompt' })).toBe(
-      tokenValues[premiumKey].prompt,
-    );
-    expect(getMultiplier({ model: 'gemini-3.1-pro-preview', tokenType: 'completion' })).toBe(
-      tokenValues[premiumKey].completion,
-    );
-  });
-
-  it('should apply premium pricing through getMultiplier with valueKey path', () => {
-    const valueKey = getValueKey('gemini-3.1-pro-preview');
-    expect(valueKey).toBe(premiumKey);
-    expect(getMultiplier({ valueKey, tokenType: 'prompt', inputTokenCount: aboveThreshold })).toBe(
-      premiumEntry.prompt,
-    );
-    expect(
-      getMultiplier({ valueKey, tokenType: 'completion', inputTokenCount: aboveThreshold }),
-    ).toBe(premiumEntry.completion);
-  });
-
-  it('should apply standard pricing through getMultiplier with valueKey path when below threshold', () => {
-    const valueKey = getValueKey('gemini-3.1-pro-preview');
-    expect(getMultiplier({ valueKey, tokenType: 'prompt', inputTokenCount: belowThreshold })).toBe(
-      tokenValues[premiumKey].prompt,
-    );
-    expect(
-      getMultiplier({ valueKey, tokenType: 'completion', inputTokenCount: belowThreshold }),
-    ).toBe(tokenValues[premiumKey].completion);
-  });
 });

 describe('Grok Model Tests - Pricing', () => {
@ -2215,201 +1689,6 @@ describe('Claude Model Tests', () => {
      );
    });
  });
-
-  it('should return correct prompt and completion rates for Claude Opus 4.6', () => {
-    expect(getMultiplier({ model: 'claude-opus-4-6', tokenType: 'prompt' })).toBe(
-      tokenValues['claude-opus-4-6'].prompt,
-    );
-    expect(getMultiplier({ model: 'claude-opus-4-6', tokenType: 'completion' })).toBe(
-      tokenValues['claude-opus-4-6'].completion,
-    );
-  });
-
-  it('should handle Claude Opus 4.6 model name variations', () => {
-    const modelVariations = [
-      'claude-opus-4-6',
-      'claude-opus-4-6-20250801',
-      'claude-opus-4-6-latest',
-      'anthropic/claude-opus-4-6',
-      'claude-opus-4-6/anthropic',
-      'claude-opus-4-6-preview',
-    ];
-
-    modelVariations.forEach((model) => {
-      const valueKey = getValueKey(model);
-      expect(valueKey).toBe('claude-opus-4-6');
-      expect(getMultiplier({ model, tokenType: 'prompt' })).toBe(
-        tokenValues['claude-opus-4-6'].prompt,
-      );
-      expect(getMultiplier({ model, tokenType: 'completion' })).toBe(
-        tokenValues['claude-opus-4-6'].completion,
-      );
-    });
-  });
-
-  it('should return correct cache rates for Claude Opus 4.6', () => {
-    expect(getCacheMultiplier({ model: 'claude-opus-4-6', cacheType: 'write' })).toBe(
-      cacheTokenValues['claude-opus-4-6'].write,
-    );
-    expect(getCacheMultiplier({ model: 'claude-opus-4-6', cacheType: 'read' })).toBe(
-      cacheTokenValues['claude-opus-4-6'].read,
-    );
-  });
-
-  it('should handle Claude Opus 4.6 cache rates with model name variations', () => {
-    const modelVariations = [
-      'claude-opus-4-6',
-      'claude-opus-4-6-20250801',
-      'claude-opus-4-6-latest',
-      'anthropic/claude-opus-4-6',
-      'claude-opus-4-6/anthropic',
-      'claude-opus-4-6-preview',
-    ];
-
-    modelVariations.forEach((model) => {
-      expect(getCacheMultiplier({ model, cacheType: 'write' })).toBe(
-        cacheTokenValues['claude-opus-4-6'].write,
-      );
-      expect(getCacheMultiplier({ model, cacheType: 'read' })).toBe(
-        cacheTokenValues['claude-opus-4-6'].read,
-      );
-    });
-  });
-});
-
-describe('Premium Token Pricing', () => {
-  const premiumModel = 'claude-opus-4-6';
-  const premiumEntry = premiumTokenValues[premiumModel];
-  const { threshold } = premiumEntry;
-  const belowThreshold = threshold - 1;
-  const aboveThreshold = threshold + 1;
-  const wellAboveThreshold = threshold * 2;
-
-  it('should have premium pricing defined for claude-opus-4-6', () => {
-    expect(premiumEntry).toBeDefined();
-    expect(premiumEntry.threshold).toBeDefined();
-    expect(premiumEntry.prompt).toBeDefined();
-    expect(premiumEntry.completion).toBeDefined();
-    expect(premiumEntry.prompt).toBeGreaterThan(tokenValues[premiumModel].prompt);
-    expect(premiumEntry.completion).toBeGreaterThan(tokenValues[premiumModel].completion);
-  });
-
-  it('should return null from getPremiumRate when inputTokenCount is below threshold', () => {
-    expect(getPremiumRate(premiumModel, 'prompt', belowThreshold)).toBeNull();
-    expect(getPremiumRate(premiumModel, 'completion', belowThreshold)).toBeNull();
-    expect(getPremiumRate(premiumModel, 'prompt', threshold)).toBeNull();
-  });
-
-  it('should return premium rate from getPremiumRate when inputTokenCount exceeds threshold', () => {
-    expect(getPremiumRate(premiumModel, 'prompt', aboveThreshold)).toBe(premiumEntry.prompt);
-    expect(getPremiumRate(premiumModel, 'completion', aboveThreshold)).toBe(
-      premiumEntry.completion,
-    );
-    expect(getPremiumRate(premiumModel, 'prompt', wellAboveThreshold)).toBe(premiumEntry.prompt);
-  });
-
-  it('should return null from getPremiumRate when inputTokenCount is undefined or null', () => {
-    expect(getPremiumRate(premiumModel, 'prompt', undefined)).toBeNull();
-    expect(getPremiumRate(premiumModel, 'prompt', null)).toBeNull();
-  });
-
-  it('should return null from getPremiumRate for models without premium pricing', () => {
-    expect(getPremiumRate('claude-opus-4-5', 'prompt', wellAboveThreshold)).toBeNull();
-    expect(getPremiumRate('claude-sonnet-4', 'prompt', wellAboveThreshold)).toBeNull();
-    expect(getPremiumRate('gpt-4o', 'prompt', wellAboveThreshold)).toBeNull();
-  });
-
-  it('should return standard rate from getMultiplier when inputTokenCount is below threshold', () => {
-    expect(
-      getMultiplier({
-        model: premiumModel,
-        tokenType: 'prompt',
-        inputTokenCount: belowThreshold,
-      }),
-    ).toBe(tokenValues[premiumModel].prompt);
-    expect(
-      getMultiplier({
-        model: premiumModel,
-        tokenType: 'completion',
-        inputTokenCount: belowThreshold,
-      }),
-    ).toBe(tokenValues[premiumModel].completion);
-  });
-
-  it('should return premium rate from getMultiplier when inputTokenCount exceeds threshold', () => {
-    expect(
-      getMultiplier({
-        model: premiumModel,
-        tokenType: 'prompt',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.prompt);
-    expect(
-      getMultiplier({
-        model: premiumModel,
-        tokenType: 'completion',
-        inputTokenCount: aboveThreshold,
-      }),
-    ).toBe(premiumEntry.completion);
-  });
-
-  it('should return standard rate from getMultiplier when inputTokenCount is exactly at threshold', () => {
-    expect(
-      getMultiplier({ model: premiumModel, tokenType: 'prompt', inputTokenCount: threshold }),
-    ).toBe(tokenValues[premiumModel].prompt);
-  });
-
-  it('should return premium rate from getMultiplier when inputTokenCount is one above threshold', () => {
-    expect(
-      getMultiplier({ model: premiumModel, tokenType: 'prompt', inputTokenCount: aboveThreshold }),
-    ).toBe(premiumEntry.prompt);
-  });
-
-  it('should not apply premium pricing to models without premium entries', () => {
-    expect(
-      getMultiplier({
-        model: 'claude-opus-4-5',
-        tokenType: 'prompt',
-        inputTokenCount: wellAboveThreshold,
-      }),
-    ).toBe(tokenValues['claude-opus-4-5'].prompt);
-    expect(
-      getMultiplier({
-        model: 'claude-sonnet-4',
-        tokenType: 'prompt',
-        inputTokenCount: wellAboveThreshold,
-      }),
-    ).toBe(tokenValues['claude-sonnet-4'].prompt);
-  });
-
-  it('should use standard rate when inputTokenCount is not provided', () => {
-    expect(getMultiplier({ model: premiumModel, tokenType: 'prompt' })).toBe(
-      tokenValues[premiumModel].prompt,
-    );
-    expect(getMultiplier({ model: premiumModel, tokenType: 'completion' })).toBe(
-      tokenValues[premiumModel].completion,
-    );
-  });
-
-  it('should apply premium pricing through getMultiplier with valueKey path', () => {
-    const valueKey = getValueKey(premiumModel);
-    expect(getMultiplier({ valueKey, tokenType: 'prompt', inputTokenCount: aboveThreshold })).toBe(
-      premiumEntry.prompt,
-    );
-    expect(
-      getMultiplier({ valueKey, tokenType: 'completion', inputTokenCount: aboveThreshold }),
-    ).toBe(premiumEntry.completion);
-  });
-
-  it('should apply standard pricing through getMultiplier with valueKey path when below threshold', () => {
-    const valueKey = getValueKey(premiumModel);
-    expect(getMultiplier({ valueKey, tokenType: 'prompt', inputTokenCount: belowThreshold })).toBe(
-      tokenValues[premiumModel].prompt,
-    );
-    expect(
-      getMultiplier({ valueKey, tokenType: 'completion', inputTokenCount: belowThreshold }),
-    ).toBe(tokenValues[premiumModel].completion);
-  });
 });

 describe('tokens.ts and tx.js sync validation', () => {
--- a/api/package.json
+++ b/api/package.json
@ -1,6 +1,6 @@
 {
  "name": "@librechat/backend",
-  "version": "v0.8.3",
+  "version": "v0.8.2",
  "description": "",
  "scripts": {
    "start": "echo 'please run this from the root directory'",
@ -34,25 +34,25 @@
  },
  "homepage": "https://librechat.ai",
  "dependencies": {
-    "@anthropic-ai/vertex-sdk": "^0.14.3",
-    "@aws-sdk/client-bedrock-runtime": "^3.980.0",
-    "@aws-sdk/client-s3": "^3.980.0",
+    "@anthropic-ai/sdk": "^0.71.0",
+    "@anthropic-ai/vertex-sdk": "^0.14.0",
+    "@aws-sdk/client-bedrock-runtime": "^3.941.0",
+    "@aws-sdk/client-s3": "^3.758.0",
    "@aws-sdk/s3-request-presigner": "^3.758.0",
    "@azure/identity": "^4.7.0",
    "@azure/search-documents": "^12.0.0",
-    "@azure/storage-blob": "^12.30.0",
+    "@azure/storage-blob": "^12.27.0",
    "@google/genai": "^1.19.0",
    "@keyv/redis": "^4.3.3",
    "@langchain/core": "^0.3.80",
-    "@librechat/agents": "^3.1.56",
+    "@librechat/agents": "^3.0.776",
    "@librechat/api": "*",
    "@librechat/data-schemas": "*",
    "@microsoft/microsoft-graph-client": "^3.0.7",
-    "@modelcontextprotocol/sdk": "^1.27.1",
+    "@modelcontextprotocol/sdk": "^1.25.3",
    "@node-saml/passport-saml": "^5.1.0",
    "@smithy/node-http-handler": "^4.4.5",
-    "ai-tokenizer": "^1.0.6",
-    "axios": "^1.13.5",
+    "axios": "^1.12.1",
    "bcryptjs": "^2.4.3",
    "compression": "^1.8.1",
    "connect-redis": "^8.1.0",
@ -64,10 +64,10 @@
    "eventsource": "^3.0.2",
    "express": "^5.2.1",
    "express-mongo-sanitize": "^2.2.0",
-    "express-rate-limit": "^8.3.0",
+    "express-rate-limit": "^8.2.1",
    "express-session": "^1.18.2",
    "express-static-gzip": "^2.2.0",
-    "file-type": "^21.3.2",
+    "file-type": "^18.7.0",
    "firebase": "^11.0.2",
    "form-data": "^4.0.4",
    "handlebars": "^4.7.7",
@ -81,14 +81,13 @@
    "klona": "^2.0.6",
    "librechat-data-provider": "*",
    "lodash": "^4.17.23",
-    "mammoth": "^1.11.0",
    "mathjs": "^15.1.0",
    "meilisearch": "^0.38.0",
    "memorystore": "^1.6.7",
    "mime": "^3.0.0",
    "module-alias": "^2.2.3",
    "mongoose": "^8.12.1",
-    "multer": "^2.1.1",
+    "multer": "^2.0.2",
    "nanoid": "^3.3.7",
    "node-fetch": "^2.7.0",
    "nodemailer": "^7.0.11",
@ -104,15 +103,14 @@
    "passport-jwt": "^4.0.1",
    "passport-ldapauth": "^3.0.1",
    "passport-local": "^1.0.0",
-    "pdfjs-dist": "^5.4.624",
    "rate-limit-redis": "^4.2.0",
    "sharp": "^0.33.5",
+    "tiktoken": "^1.0.15",
    "traverse": "^0.6.7",
    "ua-parser-js": "^1.0.36",
-    "undici": "^7.24.1",
+    "undici": "^7.18.2",
    "winston": "^3.11.0",
    "winston-daily-rotate-file": "^5.0.0",
-    "xlsx": "https://cdn.sheetjs.com/xlsx-0.20.3/xlsx-0.20.3.tgz",
    "zod": "^3.22.4"
  },
  "devDependencies": {
--- a/api/server/cleanup.js
+++ b/api/server/cleanup.js
@ -35,6 +35,7 @@ const graphPropsToClean = [
  'tools',
  'signal',
  'config',
+  'agentContexts',
  'messages',
  'contentData',
  'stepKeyIds',
@ -276,16 +277,7 @@ function disposeClient(client) {

    if (client.run) {
      if (client.run.Graph) {
-        if (typeof client.run.Graph.clearHeavyState === 'function') {
-          client.run.Graph.clearHeavyState();
-        } else {
-          client.run.Graph.resetValues();
-        }
-
-        if (client.run.Graph.agentContexts) {
-          client.run.Graph.agentContexts.clear();
-          client.run.Graph.agentContexts = null;
-        }
+        client.run.Graph.resetValues();

        graphPropsToClean.forEach((prop) => {
          if (client.run.Graph[prop] !== undefined) {
--- a/api/server/controllers/AuthController.js
+++ b/api/server/controllers/AuthController.js
@ -18,7 +18,8 @@ const {
  findUser,
 } = require('~/models');
 const { getGraphApiToken } = require('~/server/services/GraphTokenService');
-const { getOpenIdConfig, getOpenIdEmail } = require('~/strategies');
+const { getOAuthReconnectionManager } = require('~/config');
+const { getOpenIdConfig } = require('~/strategies');

 const registrationController = async (req, res) => {
  try {
@ -78,16 +79,11 @@ const refreshController = async (req, res) => {

    try {
      const openIdConfig = getOpenIdConfig();
-      const refreshParams = process.env.OPENID_SCOPE ? { scope: process.env.OPENID_SCOPE } : {};
-      const tokenset = await openIdClient.refreshTokenGrant(
-        openIdConfig,
-        refreshToken,
-        refreshParams,
-      );
+      const tokenset = await openIdClient.refreshTokenGrant(openIdConfig, refreshToken);
      const claims = tokenset.claims();
      const { user, error, migration } = await findOpenIDUser({
        findUser,
-        email: getOpenIdEmail(claims),
+        email: claims.email,
        openidId: claims.sub,
        idOnTheSource: claims.oid,
        strategyName: 'refreshController',
@ -165,6 +161,17 @@ const refreshController = async (req, res) => {
    if (session && session.expiration > new Date()) {
      const token = await setAuthTokens(userId, res, session);

+      // trigger OAuth MCP server reconnection asynchronously (best effort)
+      try {
+        void getOAuthReconnectionManager()
+          .reconnectServers(userId)
+          .catch((err) => {
+            logger.error('[refreshController] Error reconnecting OAuth MCP servers:', err);
+          });
+      } catch (err) {
+        logger.warn(`[refreshController] Cannot attempt OAuth MCP servers reconnection:`, err);
+      }
+
      res.status(200).send({ token, user });
    } else if (req?.query?.retry) {
      // Retrying from a refresh token request that failed (401)
@ -196,6 +203,15 @@ const graphTokenController = async (req, res) => {
      });
    }

+    // Extract access token from Authorization header
+    const authHeader = req.headers.authorization;
+    if (!authHeader || !authHeader.startsWith('Bearer ')) {
+      return res.status(401).json({
+        message: 'Valid authorization token required',
+      });
+    }
+
+    // Get scopes from query parameters
    const scopes = req.query.scopes;
    if (!scopes) {
      return res.status(400).json({
@ -203,13 +219,7 @@ const graphTokenController = async (req, res) => {
      });
    }

-    const accessToken = req.user.federatedTokens?.access_token;
-    if (!accessToken) {
-      return res.status(401).json({
-        message: 'No federated access token available for token exchange',
-      });
-    }
-
+    const accessToken = authHeader.substring(7); // Remove 'Bearer ' prefix
    const tokenResponse = await getGraphApiToken(req.user, accessToken, scopes);

    res.json(tokenResponse);
--- a/api/server/controllers/AuthController.spec.js
+++ b/api/server/controllers/AuthController.spec.js
@ -1,302 +0,0 @@
-jest.mock('@librechat/data-schemas', () => ({
-  logger: { error: jest.fn(), debug: jest.fn(), warn: jest.fn(), info: jest.fn() },
-}));
-jest.mock('~/server/services/GraphTokenService', () => ({
-  getGraphApiToken: jest.fn(),
-}));
-jest.mock('~/server/services/AuthService', () => ({
-  requestPasswordReset: jest.fn(),
-  setOpenIDAuthTokens: jest.fn(),
-  resetPassword: jest.fn(),
-  setAuthTokens: jest.fn(),
-  registerUser: jest.fn(),
-}));
-jest.mock('~/strategies', () => ({ getOpenIdConfig: jest.fn(), getOpenIdEmail: jest.fn() }));
-jest.mock('openid-client', () => ({ refreshTokenGrant: jest.fn() }));
-jest.mock('~/models', () => ({
-  deleteAllUserSessions: jest.fn(),
-  getUserById: jest.fn(),
-  findSession: jest.fn(),
-  updateUser: jest.fn(),
-  findUser: jest.fn(),
-}));
-jest.mock('@librechat/api', () => ({
-  isEnabled: jest.fn(),
-  findOpenIDUser: jest.fn(),
-}));
-
-const openIdClient = require('openid-client');
-const { isEnabled, findOpenIDUser } = require('@librechat/api');
-const { graphTokenController, refreshController } = require('./AuthController');
-const { getGraphApiToken } = require('~/server/services/GraphTokenService');
-const { setOpenIDAuthTokens } = require('~/server/services/AuthService');
-const { getOpenIdConfig, getOpenIdEmail } = require('~/strategies');
-const { updateUser } = require('~/models');
-
-describe('graphTokenController', () => {
-  let req, res;
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-    isEnabled.mockReturnValue(true);
-
-    req = {
-      user: {
-        openidId: 'oid-123',
-        provider: 'openid',
-        federatedTokens: {
-          access_token: 'federated-access-token',
-          id_token: 'federated-id-token',
-        },
-      },
-      headers: { authorization: 'Bearer app-jwt-which-is-id-token' },
-      query: { scopes: 'https://graph.microsoft.com/.default' },
-    };
-
-    res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-    };
-
-    getGraphApiToken.mockResolvedValue({
-      access_token: 'graph-access-token',
-      token_type: 'Bearer',
-      expires_in: 3600,
-    });
-  });
-
-  it('should pass federatedTokens.access_token as OBO assertion, not the auth header bearer token', async () => {
-    await graphTokenController(req, res);
-
-    expect(getGraphApiToken).toHaveBeenCalledWith(
-      req.user,
-      'federated-access-token',
-      'https://graph.microsoft.com/.default',
-    );
-    expect(getGraphApiToken).not.toHaveBeenCalledWith(
-      expect.anything(),
-      'app-jwt-which-is-id-token',
-      expect.anything(),
-    );
-  });
-
-  it('should return the graph token response on success', async () => {
-    await graphTokenController(req, res);
-
-    expect(res.json).toHaveBeenCalledWith({
-      access_token: 'graph-access-token',
-      token_type: 'Bearer',
-      expires_in: 3600,
-    });
-  });
-
-  it('should return 403 when user is not authenticated via Entra ID', async () => {
-    req.user.provider = 'google';
-    req.user.openidId = undefined;
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(403);
-    expect(getGraphApiToken).not.toHaveBeenCalled();
-  });
-
-  it('should return 403 when OPENID_REUSE_TOKENS is not enabled', async () => {
-    isEnabled.mockReturnValue(false);
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(403);
-    expect(getGraphApiToken).not.toHaveBeenCalled();
-  });
-
-  it('should return 400 when scopes query param is missing', async () => {
-    req.query.scopes = undefined;
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(400);
-    expect(getGraphApiToken).not.toHaveBeenCalled();
-  });
-
-  it('should return 401 when federatedTokens.access_token is missing', async () => {
-    req.user.federatedTokens = {};
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(getGraphApiToken).not.toHaveBeenCalled();
-  });
-
-  it('should return 401 when federatedTokens is absent entirely', async () => {
-    req.user.federatedTokens = undefined;
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(getGraphApiToken).not.toHaveBeenCalled();
-  });
-
-  it('should return 500 when getGraphApiToken throws', async () => {
-    getGraphApiToken.mockRejectedValue(new Error('OBO exchange failed'));
-
-    await graphTokenController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(500);
-    expect(res.json).toHaveBeenCalledWith({
-      message: 'Failed to obtain Microsoft Graph token',
-    });
-  });
-});
-
-describe('refreshController – OpenID path', () => {
-  const mockTokenset = {
-    claims: jest.fn(),
-    access_token: 'new-access',
-    id_token: 'new-id',
-    refresh_token: 'new-refresh',
-  };
-
-  const baseClaims = {
-    sub: 'oidc-sub-123',
-    oid: 'oid-456',
-    email: 'user@example.com',
-    exp: 9999999999,
-  };
-
-  let req, res;
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-
-    isEnabled.mockReturnValue(true);
-    getOpenIdConfig.mockReturnValue({ some: 'config' });
-    openIdClient.refreshTokenGrant.mockResolvedValue(mockTokenset);
-    mockTokenset.claims.mockReturnValue(baseClaims);
-    getOpenIdEmail.mockReturnValue(baseClaims.email);
-    setOpenIDAuthTokens.mockReturnValue('new-app-token');
-    updateUser.mockResolvedValue({});
-
-    req = {
-      headers: { cookie: 'token_provider=openid; refreshToken=stored-refresh' },
-      session: {},
-    };
-
-    res = {
-      status: jest.fn().mockReturnThis(),
-      send: jest.fn().mockReturnThis(),
-      redirect: jest.fn(),
-    };
-  });
-
-  it('should call getOpenIdEmail with token claims and use result for findOpenIDUser', async () => {
-    const user = {
-      _id: 'user-db-id',
-      email: baseClaims.email,
-      openidId: baseClaims.sub,
-    };
-    findOpenIDUser.mockResolvedValue({ user, error: null, migration: false });
-
-    await refreshController(req, res);
-
-    expect(getOpenIdEmail).toHaveBeenCalledWith(baseClaims);
-    expect(findOpenIDUser).toHaveBeenCalledWith(
-      expect.objectContaining({ email: baseClaims.email }),
-    );
-    expect(res.status).toHaveBeenCalledWith(200);
-  });
-
-  it('should use OPENID_EMAIL_CLAIM-resolved value when claim is present in token', async () => {
-    const claimsWithUpn = { ...baseClaims, upn: 'user@corp.example.com' };
-    mockTokenset.claims.mockReturnValue(claimsWithUpn);
-    getOpenIdEmail.mockReturnValue('user@corp.example.com');
-
-    const user = {
-      _id: 'user-db-id',
-      email: 'user@corp.example.com',
-      openidId: baseClaims.sub,
-    };
-    findOpenIDUser.mockResolvedValue({ user, error: null, migration: false });
-
-    await refreshController(req, res);
-
-    expect(getOpenIdEmail).toHaveBeenCalledWith(claimsWithUpn);
-    expect(findOpenIDUser).toHaveBeenCalledWith(
-      expect.objectContaining({ email: 'user@corp.example.com' }),
-    );
-    expect(res.status).toHaveBeenCalledWith(200);
-  });
-
-  it('should fall back to claims.email when configured claim is absent from token claims', async () => {
-    getOpenIdEmail.mockReturnValue(baseClaims.email);
-
-    const user = {
-      _id: 'user-db-id',
-      email: baseClaims.email,
-      openidId: baseClaims.sub,
-    };
-    findOpenIDUser.mockResolvedValue({ user, error: null, migration: false });
-
-    await refreshController(req, res);
-
-    expect(findOpenIDUser).toHaveBeenCalledWith(
-      expect.objectContaining({ email: baseClaims.email }),
-    );
-  });
-
-  it('should update openidId when migration is triggered on refresh', async () => {
-    const user = { _id: 'user-db-id', email: baseClaims.email, openidId: null };
-    findOpenIDUser.mockResolvedValue({ user, error: null, migration: true });
-
-    await refreshController(req, res);
-
-    expect(updateUser).toHaveBeenCalledWith(
-      'user-db-id',
-      expect.objectContaining({ provider: 'openid', openidId: baseClaims.sub }),
-    );
-    expect(res.status).toHaveBeenCalledWith(200);
-  });
-
-  it('should return 401 and redirect to /login when findOpenIDUser returns no user', async () => {
-    findOpenIDUser.mockResolvedValue({ user: null, error: null, migration: false });
-
-    await refreshController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(res.redirect).toHaveBeenCalledWith('/login');
-  });
-
-  it('should return 401 and redirect when findOpenIDUser returns an error', async () => {
-    findOpenIDUser.mockResolvedValue({ user: null, error: 'AUTH_FAILED', migration: false });
-
-    await refreshController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(res.redirect).toHaveBeenCalledWith('/login');
-  });
-
-  it('should skip OpenID path when token_provider is not openid', async () => {
-    req.headers.cookie = 'token_provider=local; refreshToken=some-token';
-
-    await refreshController(req, res);
-
-    expect(openIdClient.refreshTokenGrant).not.toHaveBeenCalled();
-  });
-
-  it('should skip OpenID path when OPENID_REUSE_TOKENS is disabled', async () => {
-    isEnabled.mockReturnValue(false);
-
-    await refreshController(req, res);
-
-    expect(openIdClient.refreshTokenGrant).not.toHaveBeenCalled();
-  });
-
-  it('should return 200 with token not provided when refresh token is absent', async () => {
-    req.headers.cookie = 'token_provider=openid';
-    req.session = {};
-
-    await refreshController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.send).toHaveBeenCalledWith('Refresh token not provided');
-  });
-});
--- a/api/server/controllers/PermissionsController.js
+++ b/api/server/controllers/PermissionsController.js
@ -5,7 +5,6 @@
 const mongoose = require('mongoose');
 const { logger } = require('@librechat/data-schemas');
 const { ResourceType, PrincipalType, PermissionBits } = require('librechat-data-provider');
-const { enrichRemoteAgentPrincipals, backfillRemoteAgentPermissions } = require('@librechat/api');
 const {
  bulkUpdateResourcePermissions,
  ensureGroupPrincipalExists,
@ -15,6 +14,7 @@ const {
  findAccessibleResources,
  getResourcePermissionsMap,
 } = require('~/server/services/PermissionService');
+const { AclEntry } = require('~/db/models');
 const {
  searchPrincipals: searchLocalPrincipals,
  sortPrincipalsByRelevance,
@ -24,7 +24,6 @@ const {
  entraIdPrincipalFeatureEnabled,
  searchEntraIdPrincipals,
 } = require('~/server/services/GraphApiService');
-const { AclEntry, AccessRole } = require('~/db/models');

 /**
 * Generic controller for resource permission endpoints
@ -235,7 +234,7 @@ const getResourcePermissions = async (req, res) => {
      },
    ]);

-    let principals = [];
+    const principals = [];
    let publicPermission = null;

    // Process aggregation results
@ -281,13 +280,6 @@ const getResourcePermissions = async (req, res) => {
      }
    }

-    if (resourceType === ResourceType.REMOTE_AGENT) {
-      const enricherDeps = { AclEntry, AccessRole, logger };
-      const enrichResult = await enrichRemoteAgentPrincipals(enricherDeps, resourceId, principals);
-      principals = enrichResult.principals;
-      backfillRemoteAgentPermissions(enricherDeps, resourceId, enrichResult.entriesToBackfill);
-    }
-
    // Return response in format expected by frontend
    const response = {
      resourceType,
--- a/api/server/controllers/PluginController.js
+++ b/api/server/controllers/PluginController.js
@ -8,7 +8,7 @@ const { getLogStores } = require('~/cache');

 const getAvailablePluginsController = async (req, res) => {
  try {
-    const cache = getLogStores(CacheKeys.TOOL_CACHE);
+    const cache = getLogStores(CacheKeys.CONFIG_STORE);
    const cachedPlugins = await cache.get(CacheKeys.PLUGINS);
    if (cachedPlugins) {
      res.status(200).json(cachedPlugins);
@ -63,7 +63,7 @@ const getAvailableTools = async (req, res) => {
      logger.warn('[getAvailableTools] User ID not found in request');
      return res.status(401).json({ message: 'Unauthorized' });
    }
-    const cache = getLogStores(CacheKeys.TOOL_CACHE);
+    const cache = getLogStores(CacheKeys.CONFIG_STORE);
    const cachedToolsArray = await cache.get(CacheKeys.TOOLS);

    const appConfig = req.config ?? (await getAppConfig({ role: req.user?.role }));
--- a/api/server/controllers/PluginController.spec.js
+++ b/api/server/controllers/PluginController.spec.js
@ -1,4 +1,3 @@
-const { CacheKeys } = require('librechat-data-provider');
 const { getCachedTools, getAppConfig } = require('~/server/services/Config');
 const { getLogStores } = require('~/cache');

@ -64,28 +63,6 @@ describe('PluginController', () => {
    });
  });

-  describe('cache namespace', () => {
-    it('getAvailablePluginsController should use TOOL_CACHE namespace', async () => {
-      mockCache.get.mockResolvedValue([]);
-      await getAvailablePluginsController(mockReq, mockRes);
-      expect(getLogStores).toHaveBeenCalledWith(CacheKeys.TOOL_CACHE);
-    });
-
-    it('getAvailableTools should use TOOL_CACHE namespace', async () => {
-      mockCache.get.mockResolvedValue([]);
-      await getAvailableTools(mockReq, mockRes);
-      expect(getLogStores).toHaveBeenCalledWith(CacheKeys.TOOL_CACHE);
-    });
-
-    it('should NOT use CONFIG_STORE namespace for tool/plugin operations', async () => {
-      mockCache.get.mockResolvedValue([]);
-      await getAvailablePluginsController(mockReq, mockRes);
-      await getAvailableTools(mockReq, mockRes);
-      const allCalls = getLogStores.mock.calls.flat();
-      expect(allCalls).not.toContain(CacheKeys.CONFIG_STORE);
-    });
-  });
-
  describe('getAvailablePluginsController', () => {
    it('should use filterUniquePlugins to remove duplicate plugins', async () => {
      // Add plugins with duplicates to availableTools
--- a/api/server/controllers/TwoFactorController.js
+++ b/api/server/controllers/TwoFactorController.js
@ -1,6 +1,5 @@
 const { encryptV3, logger } = require('@librechat/data-schemas');
 const {
-  verifyOTPOrBackupCode,
  generateBackupCodes,
  generateTOTPSecret,
  verifyBackupCode,
@ -14,42 +13,24 @@ const safeAppTitle = (process.env.APP_TITLE || 'LibreChat').replace(/\s+/g, '');
 /**
 * Enable 2FA for the user by generating a new TOTP secret and backup codes.
 * The secret is encrypted and stored, and 2FA is marked as disabled until confirmed.
- * If 2FA is already enabled, requires OTP or backup code verification to re-enroll.
 */
 const enable2FA = async (req, res) => {
  try {
    const userId = req.user.id;
-    const existingUser = await getUserById(
-      userId,
-      '+totpSecret +backupCodes _id twoFactorEnabled email',
-    );
-
-    if (existingUser && existingUser.twoFactorEnabled) {
-      const { token, backupCode } = req.body;
-      const result = await verifyOTPOrBackupCode({
-        user: existingUser,
-        token,
-        backupCode,
-        persistBackupUse: false,
-      });
-
-      if (!result.verified) {
-        const msg = result.message ?? 'TOTP token or backup code is required to re-enroll 2FA';
-        return res.status(result.status ?? 400).json({ message: msg });
-      }
-    }
-
    const secret = generateTOTPSecret();
    const { plainCodes, codeObjects } = await generateBackupCodes();
+
+    // Encrypt the secret with v3 encryption before saving.
    const encryptedSecret = encryptV3(secret);

+    // Update the user record: store the secret & backup codes and set twoFactorEnabled to false.
    const user = await updateUser(userId, {
-      pendingTotpSecret: encryptedSecret,
-      pendingBackupCodes: codeObjects,
+      totpSecret: encryptedSecret,
+      backupCodes: codeObjects,
+      twoFactorEnabled: false,
    });

-    const email = user.email || (existingUser && existingUser.email) || '';
-    const otpauthUrl = `otpauth://totp/${safeAppTitle}:${email}?secret=${secret}&issuer=${safeAppTitle}`;
+    const otpauthUrl = `otpauth://totp/${safeAppTitle}:${user.email}?secret=${secret}&issuer=${safeAppTitle}`;

    return res.status(200).json({ otpauthUrl, backupCodes: plainCodes });
  } catch (err) {
@ -65,14 +46,13 @@ const verify2FA = async (req, res) => {
  try {
    const userId = req.user.id;
    const { token, backupCode } = req.body;
-    const user = await getUserById(userId, '+totpSecret +pendingTotpSecret +backupCodes _id');
-    const secretSource = user?.pendingTotpSecret ?? user?.totpSecret;
+    const user = await getUserById(userId, '_id totpSecret backupCodes');

-    if (!user || !secretSource) {
+    if (!user || !user.totpSecret) {
      return res.status(400).json({ message: '2FA not initiated' });
    }

-    const secret = await getTOTPSecret(secretSource);
+    const secret = await getTOTPSecret(user.totpSecret);
    let isVerified = false;

    if (token) {
@ -98,28 +78,15 @@ const confirm2FA = async (req, res) => {
  try {
    const userId = req.user.id;
    const { token } = req.body;
-    const user = await getUserById(
-      userId,
-      '+totpSecret +pendingTotpSecret +pendingBackupCodes _id',
-    );
-    const secretSource = user?.pendingTotpSecret ?? user?.totpSecret;
+    const user = await getUserById(userId, '_id totpSecret');

-    if (!user || !secretSource) {
+    if (!user || !user.totpSecret) {
      return res.status(400).json({ message: '2FA not initiated' });
    }

-    const secret = await getTOTPSecret(secretSource);
+    const secret = await getTOTPSecret(user.totpSecret);
    if (await verifyTOTP(secret, token)) {
-      const update = {
-        totpSecret: user.pendingTotpSecret ?? user.totpSecret,
-        twoFactorEnabled: true,
-        pendingTotpSecret: null,
-        pendingBackupCodes: [],
-      };
-      if (user.pendingBackupCodes?.length) {
-        update.backupCodes = user.pendingBackupCodes;
-      }
-      await updateUser(userId, update);
+      await updateUser(userId, { twoFactorEnabled: true });
      return res.status(200).json();
    }
    return res.status(400).json({ message: 'Invalid token.' });
@ -137,27 +104,31 @@ const disable2FA = async (req, res) => {
  try {
    const userId = req.user.id;
    const { token, backupCode } = req.body;
-    const user = await getUserById(userId, '+totpSecret +backupCodes _id twoFactorEnabled');
+    const user = await getUserById(userId, '_id totpSecret backupCodes');

    if (!user || !user.totpSecret) {
      return res.status(400).json({ message: '2FA is not setup for this user' });
    }

    if (user.twoFactorEnabled) {
-      const result = await verifyOTPOrBackupCode({ user, token, backupCode });
+      const secret = await getTOTPSecret(user.totpSecret);
+      let isVerified = false;

-      if (!result.verified) {
-        const msg = result.message ?? 'Either token or backup code is required to disable 2FA';
-        return res.status(result.status ?? 400).json({ message: msg });
+      if (token) {
+        isVerified = await verifyTOTP(secret, token);
+      } else if (backupCode) {
+        isVerified = await verifyBackupCode({ user, backupCode });
+      } else {
+        return res
+          .status(400)
+          .json({ message: 'Either token or backup code is required to disable 2FA' });
+      }
+
+      if (!isVerified) {
+        return res.status(401).json({ message: 'Invalid token or backup code' });
      }
    }
-    await updateUser(userId, {
-      totpSecret: null,
-      backupCodes: [],
-      twoFactorEnabled: false,
-      pendingTotpSecret: null,
-      pendingBackupCodes: [],
-    });
+    await updateUser(userId, { totpSecret: null, backupCodes: [], twoFactorEnabled: false });
    return res.status(200).json();
  } catch (err) {
    logger.error('[disable2FA]', err);
@ -167,28 +138,10 @@ const disable2FA = async (req, res) => {

 /**
 * Regenerate backup codes for the user.
- * Requires OTP or backup code verification if 2FA is already enabled.
 */
 const regenerateBackupCodes = async (req, res) => {
  try {
    const userId = req.user.id;
-    const user = await getUserById(userId, '+totpSecret +backupCodes _id twoFactorEnabled');
-
-    if (!user) {
-      return res.status(404).json({ message: 'User not found' });
-    }
-
-    if (user.twoFactorEnabled) {
-      const { token, backupCode } = req.body;
-      const result = await verifyOTPOrBackupCode({ user, token, backupCode });
-
-      if (!result.verified) {
-        const msg =
-          result.message ?? 'TOTP token or backup code is required to regenerate backup codes';
-        return res.status(result.status ?? 400).json({ message: msg });
-      }
-    }
-
    const { plainCodes, codeObjects } = await generateBackupCodes();
    await updateUser(userId, { backupCodes: codeObjects });
    return res.status(200).json({
--- a/api/server/controllers/UserController.js
+++ b/api/server/controllers/UserController.js
@ -14,7 +14,6 @@ const {
  deleteMessages,
  deletePresets,
  deleteUserKey,
-  getUserById,
  deleteConvos,
  deleteFiles,
  updateUser,
@ -23,7 +22,6 @@ const {
 } = require('~/models');
 const {
  ConversationTag,
-  AgentApiKey,
  Transaction,
  MemoryEntry,
  Assistant,
@ -35,10 +33,8 @@ const {
  User,
 } = require('~/db/models');
 const { updateUserPluginAuth, deleteUserPluginAuth } = require('~/server/services/PluginService');
-const { verifyOTPOrBackupCode } = require('~/server/services/twoFactorService');
 const { verifyEmail, resendVerificationEmail } = require('~/server/services/AuthService');
 const { getMCPManager, getFlowStateManager, getMCPServersRegistry } = require('~/config');
-const { invalidateCachedTools } = require('~/server/services/Config/getCachedTools');
 const { needsRefresh, getNewS3URL } = require('~/server/services/Files/S3/crud');
 const { processDeleteRequest } = require('~/server/services/Files/process');
 const { getAppConfig } = require('~/server/services/Config');
@ -218,7 +214,6 @@ const updateUserPluginsController = async (req, res) => {
              `[updateUserPluginsController] Attempting disconnect of MCP server "${serverName}" for user ${user.id} after plugin auth update.`,
            );
            await mcpManager.disconnectUserConnection(user.id, serverName);
-            await invalidateCachedTools({ userId: user.id, serverName });
          }
        } catch (disconnectError) {
          logger.error(
@ -243,22 +238,6 @@ const deleteUserController = async (req, res) => {
  const { user } = req;

  try {
-    const existingUser = await getUserById(
-      user.id,
-      '+totpSecret +backupCodes _id twoFactorEnabled',
-    );
-    if (existingUser && existingUser.twoFactorEnabled) {
-      const { token, backupCode } = req.body;
-      const result = await verifyOTPOrBackupCode({ user: existingUser, token, backupCode });
-
-      if (!result.verified) {
-        const msg =
-          result.message ??
-          'TOTP token or backup code is required to delete account with 2FA enabled';
-        return res.status(result.status ?? 400).json({ message: msg });
-      }
-    }
-
    await deleteMessages({ user: user.id }); // delete user messages
    await deleteAllUserSessions({ userId: user.id }); // delete user sessions
    await Transaction.deleteMany({ user: user.id }); // delete user transactions
@ -277,7 +256,6 @@ const deleteUserController = async (req, res) => {
    await deleteFiles(null, user.id); // delete database files in case of orphaned files from previous steps
    await deleteToolCalls(user.id); // delete user tool calls
    await deleteUserAgents(user.id); // delete user agents
-    await AgentApiKey.deleteMany({ user: user._id }); // delete user agent API keys
    await Assistant.deleteMany({ user: user.id }); // delete user assistants
    await ConversationTag.deleteMany({ user: user.id }); // delete user conversation tags
    await MemoryEntry.deleteMany({ userId: user.id }); // delete user memory entries
@ -370,7 +348,6 @@ const maybeUninstallOAuthMCP = async (userId, pluginKey, appConfig) => {
    serverConfig.oauth?.revocation_endpoint_auth_methods_supported ??
    clientMetadata.revocation_endpoint_auth_methods_supported;
  const oauthHeaders = serverConfig.oauth_headers ?? {};
-  const allowedDomains = getMCPServersRegistry().getAllowedDomains();

  if (tokens?.access_token) {
    try {
@ -386,7 +363,6 @@ const maybeUninstallOAuthMCP = async (userId, pluginKey, appConfig) => {
          revocationEndpointAuthMethodsSupported,
        },
        oauthHeaders,
-        allowedDomains,
      );
    } catch (error) {
      logger.error(`Error revoking OAuth access token for ${serverName}:`, error);
@ -407,7 +383,6 @@ const maybeUninstallOAuthMCP = async (userId, pluginKey, appConfig) => {
          revocationEndpointAuthMethodsSupported,
        },
        oauthHeaders,
-        allowedDomains,
      );
    } catch (error) {
      logger.error(`Error revoking OAuth refresh token for ${serverName}:`, error);
--- a/api/server/controllers/tests/TwoFactorController.spec.js
+++ b/api/server/controllers/tests/TwoFactorController.spec.js
@ -1,264 +0,0 @@
-const mockGetUserById = jest.fn();
-const mockUpdateUser = jest.fn();
-const mockVerifyOTPOrBackupCode = jest.fn();
-const mockGenerateTOTPSecret = jest.fn();
-const mockGenerateBackupCodes = jest.fn();
-const mockEncryptV3 = jest.fn();
-
-jest.mock('@librechat/data-schemas', () => ({
-  encryptV3: (...args) => mockEncryptV3(...args),
-  logger: { error: jest.fn() },
-}));
-
-jest.mock('~/server/services/twoFactorService', () => ({
-  verifyOTPOrBackupCode: (...args) => mockVerifyOTPOrBackupCode(...args),
-  generateBackupCodes: (...args) => mockGenerateBackupCodes(...args),
-  generateTOTPSecret: (...args) => mockGenerateTOTPSecret(...args),
-  verifyBackupCode: jest.fn(),
-  getTOTPSecret: jest.fn(),
-  verifyTOTP: jest.fn(),
-}));
-
-jest.mock('~/models', () => ({
-  getUserById: (...args) => mockGetUserById(...args),
-  updateUser: (...args) => mockUpdateUser(...args),
-}));
-
-const { enable2FA, regenerateBackupCodes } = require('~/server/controllers/TwoFactorController');
-
-function createRes() {
-  const res = {};
-  res.status = jest.fn().mockReturnValue(res);
-  res.json = jest.fn().mockReturnValue(res);
-  return res;
-}
-
-const PLAIN_CODES = ['code1', 'code2', 'code3'];
-const CODE_OBJECTS = [
-  { codeHash: 'h1', used: false, usedAt: null },
-  { codeHash: 'h2', used: false, usedAt: null },
-  { codeHash: 'h3', used: false, usedAt: null },
-];
-
-beforeEach(() => {
-  jest.clearAllMocks();
-  mockGenerateTOTPSecret.mockReturnValue('NEWSECRET');
-  mockGenerateBackupCodes.mockResolvedValue({ plainCodes: PLAIN_CODES, codeObjects: CODE_OBJECTS });
-  mockEncryptV3.mockReturnValue('encrypted-secret');
-});
-
-describe('enable2FA', () => {
-  it('allows first-time setup without token — writes to pending fields', async () => {
-    const req = { user: { id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({ _id: 'user1', twoFactorEnabled: false, email: 'a@b.com' });
-    mockUpdateUser.mockResolvedValue({ email: 'a@b.com' });
-
-    await enable2FA(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.json).toHaveBeenCalledWith(
-      expect.objectContaining({ otpauthUrl: expect.any(String), backupCodes: PLAIN_CODES }),
-    );
-    expect(mockVerifyOTPOrBackupCode).not.toHaveBeenCalled();
-    const updateCall = mockUpdateUser.mock.calls[0][1];
-    expect(updateCall).toHaveProperty('pendingTotpSecret', 'encrypted-secret');
-    expect(updateCall).toHaveProperty('pendingBackupCodes', CODE_OBJECTS);
-    expect(updateCall).not.toHaveProperty('twoFactorEnabled');
-    expect(updateCall).not.toHaveProperty('totpSecret');
-    expect(updateCall).not.toHaveProperty('backupCodes');
-  });
-
-  it('re-enrollment writes to pending fields, leaving live 2FA intact', async () => {
-    const req = { user: { id: 'user1' }, body: { token: '123456' } };
-    const res = createRes();
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-      email: 'a@b.com',
-    };
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-    mockUpdateUser.mockResolvedValue({ email: 'a@b.com' });
-
-    await enable2FA(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith({
-      user: existingUser,
-      token: '123456',
-      backupCode: undefined,
-      persistBackupUse: false,
-    });
-    expect(res.status).toHaveBeenCalledWith(200);
-    const updateCall = mockUpdateUser.mock.calls[0][1];
-    expect(updateCall).toHaveProperty('pendingTotpSecret', 'encrypted-secret');
-    expect(updateCall).toHaveProperty('pendingBackupCodes', CODE_OBJECTS);
-    expect(updateCall).not.toHaveProperty('twoFactorEnabled');
-    expect(updateCall).not.toHaveProperty('totpSecret');
-  });
-
-  it('allows re-enrollment with valid backup code (persistBackupUse: false)', async () => {
-    const req = { user: { id: 'user1' }, body: { backupCode: 'backup123' } };
-    const res = createRes();
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-      email: 'a@b.com',
-    };
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-    mockUpdateUser.mockResolvedValue({ email: 'a@b.com' });
-
-    await enable2FA(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith(
-      expect.objectContaining({ persistBackupUse: false }),
-    );
-    expect(res.status).toHaveBeenCalledWith(200);
-  });
-
-  it('returns error when no token provided and 2FA is enabled', async () => {
-    const req = { user: { id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: false, status: 400 });
-
-    await enable2FA(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(400);
-    expect(mockUpdateUser).not.toHaveBeenCalled();
-  });
-
-  it('returns 401 when invalid token provided and 2FA is enabled', async () => {
-    const req = { user: { id: 'user1' }, body: { token: 'wrong' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({
-      verified: false,
-      status: 401,
-      message: 'Invalid token or backup code',
-    });
-
-    await enable2FA(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(res.json).toHaveBeenCalledWith({ message: 'Invalid token or backup code' });
-    expect(mockUpdateUser).not.toHaveBeenCalled();
-  });
-});
-
-describe('regenerateBackupCodes', () => {
-  it('returns 404 when user not found', async () => {
-    const req = { user: { id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(null);
-
-    await regenerateBackupCodes(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(404);
-    expect(res.json).toHaveBeenCalledWith({ message: 'User not found' });
-  });
-
-  it('requires OTP when 2FA is enabled', async () => {
-    const req = { user: { id: 'user1' }, body: { token: '123456' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-    mockUpdateUser.mockResolvedValue({});
-
-    await regenerateBackupCodes(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalled();
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.json).toHaveBeenCalledWith({
-      backupCodes: PLAIN_CODES,
-      backupCodesHash: CODE_OBJECTS,
-    });
-  });
-
-  it('returns error when no token provided and 2FA is enabled', async () => {
-    const req = { user: { id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: false, status: 400 });
-
-    await regenerateBackupCodes(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(400);
-  });
-
-  it('returns 401 when invalid token provided and 2FA is enabled', async () => {
-    const req = { user: { id: 'user1' }, body: { token: 'wrong' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({
-      verified: false,
-      status: 401,
-      message: 'Invalid token or backup code',
-    });
-
-    await regenerateBackupCodes(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(res.json).toHaveBeenCalledWith({ message: 'Invalid token or backup code' });
-  });
-
-  it('includes backupCodesHash in response', async () => {
-    const req = { user: { id: 'user1' }, body: { token: '123456' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-    mockUpdateUser.mockResolvedValue({});
-
-    await regenerateBackupCodes(req, res);
-
-    const responseBody = res.json.mock.calls[0][0];
-    expect(responseBody).toHaveProperty('backupCodesHash', CODE_OBJECTS);
-    expect(responseBody).toHaveProperty('backupCodes', PLAIN_CODES);
-  });
-
-  it('allows regeneration without token when 2FA is not enabled', async () => {
-    const req = { user: { id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: false,
-    });
-    mockUpdateUser.mockResolvedValue({});
-
-    await regenerateBackupCodes(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).not.toHaveBeenCalled();
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.json).toHaveBeenCalledWith({
-      backupCodes: PLAIN_CODES,
-      backupCodesHash: CODE_OBJECTS,
-    });
-  });
-});
--- a/api/server/controllers/tests/deleteUser.spec.js
+++ b/api/server/controllers/tests/deleteUser.spec.js
@ -1,302 +0,0 @@
-const mockGetUserById = jest.fn();
-const mockDeleteMessages = jest.fn();
-const mockDeleteAllUserSessions = jest.fn();
-const mockDeleteUserById = jest.fn();
-const mockDeleteAllSharedLinks = jest.fn();
-const mockDeletePresets = jest.fn();
-const mockDeleteUserKey = jest.fn();
-const mockDeleteConvos = jest.fn();
-const mockDeleteFiles = jest.fn();
-const mockGetFiles = jest.fn();
-const mockUpdateUserPlugins = jest.fn();
-const mockUpdateUser = jest.fn();
-const mockFindToken = jest.fn();
-const mockVerifyOTPOrBackupCode = jest.fn();
-const mockDeleteUserPluginAuth = jest.fn();
-const mockProcessDeleteRequest = jest.fn();
-const mockDeleteToolCalls = jest.fn();
-const mockDeleteUserAgents = jest.fn();
-const mockDeleteUserPrompts = jest.fn();
-
-jest.mock('@librechat/data-schemas', () => ({
-  logger: { error: jest.fn(), info: jest.fn() },
-  webSearchKeys: [],
-}));
-
-jest.mock('librechat-data-provider', () => ({
-  Tools: {},
-  CacheKeys: {},
-  Constants: { mcp_delimiter: '::', mcp_prefix: 'mcp_' },
-  FileSources: {},
-}));
-
-jest.mock('@librechat/api', () => ({
-  MCPOAuthHandler: {},
-  MCPTokenStorage: {},
-  normalizeHttpError: jest.fn(),
-  extractWebSearchEnvVars: jest.fn(),
-}));
-
-jest.mock('~/models', () => ({
-  deleteAllUserSessions: (...args) => mockDeleteAllUserSessions(...args),
-  deleteAllSharedLinks: (...args) => mockDeleteAllSharedLinks(...args),
-  updateUserPlugins: (...args) => mockUpdateUserPlugins(...args),
-  deleteUserById: (...args) => mockDeleteUserById(...args),
-  deleteMessages: (...args) => mockDeleteMessages(...args),
-  deletePresets: (...args) => mockDeletePresets(...args),
-  deleteUserKey: (...args) => mockDeleteUserKey(...args),
-  getUserById: (...args) => mockGetUserById(...args),
-  deleteConvos: (...args) => mockDeleteConvos(...args),
-  deleteFiles: (...args) => mockDeleteFiles(...args),
-  updateUser: (...args) => mockUpdateUser(...args),
-  findToken: (...args) => mockFindToken(...args),
-  getFiles: (...args) => mockGetFiles(...args),
-}));
-
-jest.mock('~/db/models', () => ({
-  ConversationTag: { deleteMany: jest.fn() },
-  AgentApiKey: { deleteMany: jest.fn() },
-  Transaction: { deleteMany: jest.fn() },
-  MemoryEntry: { deleteMany: jest.fn() },
-  Assistant: { deleteMany: jest.fn() },
-  AclEntry: { deleteMany: jest.fn() },
-  Balance: { deleteMany: jest.fn() },
-  Action: { deleteMany: jest.fn() },
-  Group: { updateMany: jest.fn() },
-  Token: { deleteMany: jest.fn() },
-  User: {},
-}));
-
-jest.mock('~/server/services/PluginService', () => ({
-  updateUserPluginAuth: jest.fn(),
-  deleteUserPluginAuth: (...args) => mockDeleteUserPluginAuth(...args),
-}));
-
-jest.mock('~/server/services/twoFactorService', () => ({
-  verifyOTPOrBackupCode: (...args) => mockVerifyOTPOrBackupCode(...args),
-}));
-
-jest.mock('~/server/services/AuthService', () => ({
-  verifyEmail: jest.fn(),
-  resendVerificationEmail: jest.fn(),
-}));
-
-jest.mock('~/config', () => ({
-  getMCPManager: jest.fn(),
-  getFlowStateManager: jest.fn(),
-  getMCPServersRegistry: jest.fn(),
-}));
-
-jest.mock('~/server/services/Config/getCachedTools', () => ({
-  invalidateCachedTools: jest.fn(),
-}));
-
-jest.mock('~/server/services/Files/S3/crud', () => ({
-  needsRefresh: jest.fn(),
-  getNewS3URL: jest.fn(),
-}));
-
-jest.mock('~/server/services/Files/process', () => ({
-  processDeleteRequest: (...args) => mockProcessDeleteRequest(...args),
-}));
-
-jest.mock('~/server/services/Config', () => ({
-  getAppConfig: jest.fn(),
-}));
-
-jest.mock('~/models/ToolCall', () => ({
-  deleteToolCalls: (...args) => mockDeleteToolCalls(...args),
-}));
-
-jest.mock('~/models/Prompt', () => ({
-  deleteUserPrompts: (...args) => mockDeleteUserPrompts(...args),
-}));
-
-jest.mock('~/models/Agent', () => ({
-  deleteUserAgents: (...args) => mockDeleteUserAgents(...args),
-}));
-
-jest.mock('~/cache', () => ({
-  getLogStores: jest.fn(),
-}));
-
-const { deleteUserController } = require('~/server/controllers/UserController');
-
-function createRes() {
-  const res = {};
-  res.status = jest.fn().mockReturnValue(res);
-  res.json = jest.fn().mockReturnValue(res);
-  res.send = jest.fn().mockReturnValue(res);
-  return res;
-}
-
-function stubDeletionMocks() {
-  mockDeleteMessages.mockResolvedValue();
-  mockDeleteAllUserSessions.mockResolvedValue();
-  mockDeleteUserKey.mockResolvedValue();
-  mockDeletePresets.mockResolvedValue();
-  mockDeleteConvos.mockResolvedValue();
-  mockDeleteUserPluginAuth.mockResolvedValue();
-  mockDeleteUserById.mockResolvedValue();
-  mockDeleteAllSharedLinks.mockResolvedValue();
-  mockGetFiles.mockResolvedValue([]);
-  mockProcessDeleteRequest.mockResolvedValue();
-  mockDeleteFiles.mockResolvedValue();
-  mockDeleteToolCalls.mockResolvedValue();
-  mockDeleteUserAgents.mockResolvedValue();
-  mockDeleteUserPrompts.mockResolvedValue();
-}
-
-beforeEach(() => {
-  jest.clearAllMocks();
-  stubDeletionMocks();
-});
-
-describe('deleteUserController - 2FA enforcement', () => {
-  it('proceeds with deletion when 2FA is not enabled', async () => {
-    const req = { user: { id: 'user1', _id: 'user1', email: 'a@b.com' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({ _id: 'user1', twoFactorEnabled: false });
-
-    await deleteUserController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.send).toHaveBeenCalledWith({ message: 'User deleted' });
-    expect(mockDeleteMessages).toHaveBeenCalled();
-    expect(mockVerifyOTPOrBackupCode).not.toHaveBeenCalled();
-  });
-
-  it('proceeds with deletion when user has no 2FA record', async () => {
-    const req = { user: { id: 'user1', _id: 'user1', email: 'a@b.com' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(null);
-
-    await deleteUserController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.send).toHaveBeenCalledWith({ message: 'User deleted' });
-  });
-
-  it('returns error when 2FA is enabled and verification fails with 400', async () => {
-    const req = { user: { id: 'user1', _id: 'user1' }, body: {} };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue({
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    });
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: false, status: 400 });
-
-    await deleteUserController(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(400);
-    expect(mockDeleteMessages).not.toHaveBeenCalled();
-  });
-
-  it('returns 401 when 2FA is enabled and invalid TOTP token provided', async () => {
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    };
-    const req = { user: { id: 'user1', _id: 'user1' }, body: { token: 'wrong' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({
-      verified: false,
-      status: 401,
-      message: 'Invalid token or backup code',
-    });
-
-    await deleteUserController(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith({
-      user: existingUser,
-      token: 'wrong',
-      backupCode: undefined,
-    });
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(res.json).toHaveBeenCalledWith({ message: 'Invalid token or backup code' });
-    expect(mockDeleteMessages).not.toHaveBeenCalled();
-  });
-
-  it('returns 401 when 2FA is enabled and invalid backup code provided', async () => {
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-      backupCodes: [],
-    };
-    const req = { user: { id: 'user1', _id: 'user1' }, body: { backupCode: 'bad-code' } };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({
-      verified: false,
-      status: 401,
-      message: 'Invalid token or backup code',
-    });
-
-    await deleteUserController(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith({
-      user: existingUser,
-      token: undefined,
-      backupCode: 'bad-code',
-    });
-    expect(res.status).toHaveBeenCalledWith(401);
-    expect(mockDeleteMessages).not.toHaveBeenCalled();
-  });
-
-  it('deletes account when valid TOTP token provided with 2FA enabled', async () => {
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-    };
-    const req = {
-      user: { id: 'user1', _id: 'user1', email: 'a@b.com' },
-      body: { token: '123456' },
-    };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-
-    await deleteUserController(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith({
-      user: existingUser,
-      token: '123456',
-      backupCode: undefined,
-    });
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.send).toHaveBeenCalledWith({ message: 'User deleted' });
-    expect(mockDeleteMessages).toHaveBeenCalled();
-  });
-
-  it('deletes account when valid backup code provided with 2FA enabled', async () => {
-    const existingUser = {
-      _id: 'user1',
-      twoFactorEnabled: true,
-      totpSecret: 'enc-secret',
-      backupCodes: [{ codeHash: 'h1', used: false }],
-    };
-    const req = {
-      user: { id: 'user1', _id: 'user1', email: 'a@b.com' },
-      body: { backupCode: 'valid-code' },
-    };
-    const res = createRes();
-    mockGetUserById.mockResolvedValue(existingUser);
-    mockVerifyOTPOrBackupCode.mockResolvedValue({ verified: true });
-
-    await deleteUserController(req, res);
-
-    expect(mockVerifyOTPOrBackupCode).toHaveBeenCalledWith({
-      user: existingUser,
-      token: undefined,
-      backupCode: 'valid-code',
-    });
-    expect(res.status).toHaveBeenCalledWith(200);
-    expect(res.send).toHaveBeenCalledWith({ message: 'User deleted' });
-    expect(mockDeleteMessages).toHaveBeenCalled();
-  });
-});
--- a/api/server/controllers/agents/tests/callbacks.spec.js
+++ b/api/server/controllers/agents/tests/callbacks.spec.js
@ -16,10 +16,13 @@ jest.mock('@librechat/data-schemas', () => ({
 }));

 jest.mock('@librechat/agents', () => ({
-  ...jest.requireActual('@librechat/agents'),
+  EnvVar: { CODE_API_KEY: 'CODE_API_KEY' },
+  Providers: { GOOGLE: 'google' },
+  GraphEvents: {},
  getMessageId: jest.fn(),
  ToolEndHandler: jest.fn(),
  handleToolCalls: jest.fn(),
+  ChatModelStreamHandler: jest.fn(),
 }));

 jest.mock('~/server/services/Files/Citations', () => ({
--- a/api/server/controllers/agents/tests/openai.spec.js
+++ b/api/server/controllers/agents/tests/openai.spec.js
@ -1,229 +0,0 @@
-/**
- * Unit tests for OpenAI-compatible API controller
- * Tests that recordCollectedUsage is called correctly for token spending
- */
-
-const mockSpendTokens = jest.fn().mockResolvedValue({});
-const mockSpendStructuredTokens = jest.fn().mockResolvedValue({});
-const mockRecordCollectedUsage = jest
-  .fn()
-  .mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
-const mockGetBalanceConfig = jest.fn().mockReturnValue({ enabled: true });
-const mockGetTransactionsConfig = jest.fn().mockReturnValue({ enabled: true });
-
-jest.mock('nanoid', () => ({
-  nanoid: jest.fn(() => 'mock-nanoid-123'),
-}));
-
-jest.mock('@librechat/data-schemas', () => ({
-  logger: {
-    debug: jest.fn(),
-    error: jest.fn(),
-    warn: jest.fn(),
-  },
-}));
-
-jest.mock('@librechat/agents', () => ({
-  Callback: { TOOL_ERROR: 'TOOL_ERROR' },
-  ToolEndHandler: jest.fn(),
-  formatAgentMessages: jest.fn().mockReturnValue({
-    messages: [],
-    indexTokenCountMap: {},
-  }),
-}));
-
-jest.mock('@librechat/api', () => ({
-  writeSSE: jest.fn(),
-  createRun: jest.fn().mockResolvedValue({
-    processStream: jest.fn().mockResolvedValue(undefined),
-  }),
-  createChunk: jest.fn().mockReturnValue({}),
-  buildToolSet: jest.fn().mockReturnValue(new Set()),
-  sendFinalChunk: jest.fn(),
-  createSafeUser: jest.fn().mockReturnValue({ id: 'user-123' }),
-  validateRequest: jest
-    .fn()
-    .mockReturnValue({ request: { model: 'agent-123', messages: [], stream: false } }),
-  initializeAgent: jest.fn().mockResolvedValue({
-    model: 'gpt-4',
-    model_parameters: {},
-    toolRegistry: {},
-  }),
-  getBalanceConfig: mockGetBalanceConfig,
-  createErrorResponse: jest.fn(),
-  getTransactionsConfig: mockGetTransactionsConfig,
-  recordCollectedUsage: mockRecordCollectedUsage,
-  buildNonStreamingResponse: jest.fn().mockReturnValue({ id: 'resp-123' }),
-  createOpenAIStreamTracker: jest.fn().mockReturnValue({
-    addText: jest.fn(),
-    addReasoning: jest.fn(),
-    toolCalls: new Map(),
-    usage: { promptTokens: 0, completionTokens: 0, reasoningTokens: 0 },
-  }),
-  createOpenAIContentAggregator: jest.fn().mockReturnValue({
-    addText: jest.fn(),
-    addReasoning: jest.fn(),
-    getText: jest.fn().mockReturnValue(''),
-    getReasoning: jest.fn().mockReturnValue(''),
-    toolCalls: new Map(),
-    usage: { promptTokens: 100, completionTokens: 50, reasoningTokens: 0 },
-  }),
-  createToolExecuteHandler: jest.fn().mockReturnValue({ handle: jest.fn() }),
-  isChatCompletionValidationFailure: jest.fn().mockReturnValue(false),
-}));
-
-jest.mock('~/server/services/ToolService', () => ({
-  loadAgentTools: jest.fn().mockResolvedValue([]),
-  loadToolsForExecution: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/spendTokens', () => ({
-  spendTokens: mockSpendTokens,
-  spendStructuredTokens: mockSpendStructuredTokens,
-}));
-
-const mockGetMultiplier = jest.fn().mockReturnValue(1);
-const mockGetCacheMultiplier = jest.fn().mockReturnValue(null);
-jest.mock('~/models/tx', () => ({
-  getMultiplier: mockGetMultiplier,
-  getCacheMultiplier: mockGetCacheMultiplier,
-}));
-
-jest.mock('~/server/controllers/agents/callbacks', () => ({
-  createToolEndCallback: jest.fn().mockReturnValue(jest.fn()),
-}));
-
-jest.mock('~/server/services/PermissionService', () => ({
-  findAccessibleResources: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/Conversation', () => ({
-  getConvoFiles: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/Agent', () => ({
-  getAgent: jest.fn().mockResolvedValue({
-    id: 'agent-123',
-    provider: 'openAI',
-    model_parameters: { model: 'gpt-4' },
-  }),
-  getAgents: jest.fn().mockResolvedValue([]),
-}));
-
-const mockUpdateBalance = jest.fn().mockResolvedValue({});
-const mockBulkInsertTransactions = jest.fn().mockResolvedValue(undefined);
-jest.mock('~/models', () => ({
-  getFiles: jest.fn(),
-  getUserKey: jest.fn(),
-  getMessages: jest.fn(),
-  updateFilesUsage: jest.fn(),
-  getUserKeyValues: jest.fn(),
-  getUserCodeFiles: jest.fn(),
-  getToolFilesByIds: jest.fn(),
-  getCodeGeneratedFiles: jest.fn(),
-  updateBalance: mockUpdateBalance,
-  bulkInsertTransactions: mockBulkInsertTransactions,
-}));
-
-describe('OpenAIChatCompletionController', () => {
-  let OpenAIChatCompletionController;
-  let req, res;
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-
-    const controller = require('../openai');
-    OpenAIChatCompletionController = controller.OpenAIChatCompletionController;
-
-    req = {
-      body: {
-        model: 'agent-123',
-        messages: [{ role: 'user', content: 'Hello' }],
-        stream: false,
-      },
-      user: { id: 'user-123' },
-      config: {
-        endpoints: {
-          agents: { allowedProviders: ['openAI'] },
-        },
-      },
-      on: jest.fn(),
-    };
-
-    res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-      setHeader: jest.fn(),
-      flushHeaders: jest.fn(),
-      end: jest.fn(),
-      write: jest.fn(),
-    };
-  });
-
-  describe('token usage recording', () => {
-    it('should call recordCollectedUsage after successful non-streaming completion', async () => {
-      await OpenAIChatCompletionController(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        {
-          spendTokens: mockSpendTokens,
-          spendStructuredTokens: mockSpendStructuredTokens,
-          pricing: { getMultiplier: mockGetMultiplier, getCacheMultiplier: mockGetCacheMultiplier },
-          bulkWriteOps: {
-            insertMany: mockBulkInsertTransactions,
-            updateBalance: mockUpdateBalance,
-          },
-        },
-        expect.objectContaining({
-          user: 'user-123',
-          conversationId: expect.any(String),
-          collectedUsage: expect.any(Array),
-          context: 'message',
-          balance: { enabled: true },
-          transactions: { enabled: true },
-        }),
-      );
-    });
-
-    it('should pass balance and transactions config to recordCollectedUsage', async () => {
-      mockGetBalanceConfig.mockReturnValue({ enabled: true, startBalance: 1000 });
-      mockGetTransactionsConfig.mockReturnValue({ enabled: true, rateLimit: 100 });
-
-      await OpenAIChatCompletionController(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          balance: { enabled: true, startBalance: 1000 },
-          transactions: { enabled: true, rateLimit: 100 },
-        }),
-      );
-    });
-
-    it('should pass spendTokens, spendStructuredTokens, pricing, and bulkWriteOps as dependencies', async () => {
-      await OpenAIChatCompletionController(req, res);
-
-      const [deps] = mockRecordCollectedUsage.mock.calls[0];
-      expect(deps).toHaveProperty('spendTokens', mockSpendTokens);
-      expect(deps).toHaveProperty('spendStructuredTokens', mockSpendStructuredTokens);
-      expect(deps).toHaveProperty('pricing');
-      expect(deps.pricing).toHaveProperty('getMultiplier', mockGetMultiplier);
-      expect(deps.pricing).toHaveProperty('getCacheMultiplier', mockGetCacheMultiplier);
-      expect(deps).toHaveProperty('bulkWriteOps');
-      expect(deps.bulkWriteOps).toHaveProperty('insertMany', mockBulkInsertTransactions);
-      expect(deps.bulkWriteOps).toHaveProperty('updateBalance', mockUpdateBalance);
-    });
-
-    it('should include model from primaryConfig in recordCollectedUsage params', async () => {
-      await OpenAIChatCompletionController(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          model: 'gpt-4',
-        }),
-      );
-    });
-  });
-});
--- a/api/server/controllers/agents/tests/responses.unit.spec.js
+++ b/api/server/controllers/agents/tests/responses.unit.spec.js
@ -1,345 +0,0 @@
-/**
- * Unit tests for Open Responses API controller
- * Tests that recordCollectedUsage is called correctly for token spending
- */
-
-const mockSpendTokens = jest.fn().mockResolvedValue({});
-const mockSpendStructuredTokens = jest.fn().mockResolvedValue({});
-const mockRecordCollectedUsage = jest
-  .fn()
-  .mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
-const mockGetBalanceConfig = jest.fn().mockReturnValue({ enabled: true });
-const mockGetTransactionsConfig = jest.fn().mockReturnValue({ enabled: true });
-
-jest.mock('nanoid', () => ({
-  nanoid: jest.fn(() => 'mock-nanoid-123'),
-}));
-
-jest.mock('uuid', () => ({
-  v4: jest.fn(() => 'mock-uuid-456'),
-}));
-
-jest.mock('@librechat/data-schemas', () => ({
-  logger: {
-    debug: jest.fn(),
-    error: jest.fn(),
-    warn: jest.fn(),
-  },
-}));
-
-jest.mock('@librechat/agents', () => ({
-  Callback: { TOOL_ERROR: 'TOOL_ERROR' },
-  ToolEndHandler: jest.fn(),
-  formatAgentMessages: jest.fn().mockReturnValue({
-    messages: [],
-    indexTokenCountMap: {},
-  }),
-}));
-
-jest.mock('@librechat/api', () => ({
-  createRun: jest.fn().mockResolvedValue({
-    processStream: jest.fn().mockResolvedValue(undefined),
-  }),
-  buildToolSet: jest.fn().mockReturnValue(new Set()),
-  createSafeUser: jest.fn().mockReturnValue({ id: 'user-123' }),
-  initializeAgent: jest.fn().mockResolvedValue({
-    model: 'claude-3',
-    model_parameters: {},
-    toolRegistry: {},
-  }),
-  getBalanceConfig: mockGetBalanceConfig,
-  getTransactionsConfig: mockGetTransactionsConfig,
-  recordCollectedUsage: mockRecordCollectedUsage,
-  createToolExecuteHandler: jest.fn().mockReturnValue({ handle: jest.fn() }),
-  // Responses API
-  writeDone: jest.fn(),
-  buildResponse: jest.fn().mockReturnValue({ id: 'resp_123', output: [] }),
-  generateResponseId: jest.fn().mockReturnValue('resp_mock-123'),
-  isValidationFailure: jest.fn().mockReturnValue(false),
-  emitResponseCreated: jest.fn(),
-  createResponseContext: jest.fn().mockReturnValue({ responseId: 'resp_123' }),
-  createResponseTracker: jest.fn().mockReturnValue({
-    usage: { promptTokens: 100, completionTokens: 50 },
-  }),
-  setupStreamingResponse: jest.fn(),
-  emitResponseInProgress: jest.fn(),
-  convertInputToMessages: jest.fn().mockReturnValue([]),
-  validateResponseRequest: jest.fn().mockReturnValue({
-    request: { model: 'agent-123', input: 'Hello', stream: false },
-  }),
-  buildAggregatedResponse: jest.fn().mockReturnValue({
-    id: 'resp_123',
-    status: 'completed',
-    output: [],
-    usage: { input_tokens: 100, output_tokens: 50, total_tokens: 150 },
-  }),
-  createResponseAggregator: jest.fn().mockReturnValue({
-    usage: { promptTokens: 100, completionTokens: 50 },
-  }),
-  sendResponsesErrorResponse: jest.fn(),
-  createResponsesEventHandlers: jest.fn().mockReturnValue({
-    handlers: {
-      on_message_delta: { handle: jest.fn() },
-      on_reasoning_delta: { handle: jest.fn() },
-      on_run_step: { handle: jest.fn() },
-      on_run_step_delta: { handle: jest.fn() },
-      on_chat_model_end: { handle: jest.fn() },
-    },
-    finalizeStream: jest.fn(),
-  }),
-  createAggregatorEventHandlers: jest.fn().mockReturnValue({
-    on_message_delta: { handle: jest.fn() },
-    on_reasoning_delta: { handle: jest.fn() },
-    on_run_step: { handle: jest.fn() },
-    on_run_step_delta: { handle: jest.fn() },
-    on_chat_model_end: { handle: jest.fn() },
-  }),
-}));
-
-jest.mock('~/server/services/ToolService', () => ({
-  loadAgentTools: jest.fn().mockResolvedValue([]),
-  loadToolsForExecution: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/spendTokens', () => ({
-  spendTokens: mockSpendTokens,
-  spendStructuredTokens: mockSpendStructuredTokens,
-}));
-
-const mockGetMultiplier = jest.fn().mockReturnValue(1);
-const mockGetCacheMultiplier = jest.fn().mockReturnValue(null);
-jest.mock('~/models/tx', () => ({
-  getMultiplier: mockGetMultiplier,
-  getCacheMultiplier: mockGetCacheMultiplier,
-}));
-
-jest.mock('~/server/controllers/agents/callbacks', () => ({
-  createToolEndCallback: jest.fn().mockReturnValue(jest.fn()),
-  createResponsesToolEndCallback: jest.fn().mockReturnValue(jest.fn()),
-}));
-
-jest.mock('~/server/services/PermissionService', () => ({
-  findAccessibleResources: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/Conversation', () => ({
-  getConvoFiles: jest.fn().mockResolvedValue([]),
-  saveConvo: jest.fn().mockResolvedValue({}),
-  getConvo: jest.fn().mockResolvedValue(null),
-}));
-
-jest.mock('~/models/Agent', () => ({
-  getAgent: jest.fn().mockResolvedValue({
-    id: 'agent-123',
-    name: 'Test Agent',
-    provider: 'anthropic',
-    model_parameters: { model: 'claude-3' },
-  }),
-  getAgents: jest.fn().mockResolvedValue([]),
-}));
-
-const mockUpdateBalance = jest.fn().mockResolvedValue({});
-const mockBulkInsertTransactions = jest.fn().mockResolvedValue(undefined);
-jest.mock('~/models', () => ({
-  getFiles: jest.fn(),
-  getUserKey: jest.fn(),
-  getMessages: jest.fn().mockResolvedValue([]),
-  saveMessage: jest.fn().mockResolvedValue({}),
-  updateFilesUsage: jest.fn(),
-  getUserKeyValues: jest.fn(),
-  getUserCodeFiles: jest.fn(),
-  getToolFilesByIds: jest.fn(),
-  getCodeGeneratedFiles: jest.fn(),
-  updateBalance: mockUpdateBalance,
-  bulkInsertTransactions: mockBulkInsertTransactions,
-}));
-
-describe('createResponse controller', () => {
-  let createResponse;
-  let req, res;
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-
-    const controller = require('../responses');
-    createResponse = controller.createResponse;
-
-    req = {
-      body: {
-        model: 'agent-123',
-        input: 'Hello',
-        stream: false,
-      },
-      user: { id: 'user-123' },
-      config: {
-        endpoints: {
-          agents: { allowedProviders: ['anthropic'] },
-        },
-      },
-      on: jest.fn(),
-    };
-
-    res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-      setHeader: jest.fn(),
-      flushHeaders: jest.fn(),
-      end: jest.fn(),
-      write: jest.fn(),
-    };
-  });
-
-  describe('token usage recording - non-streaming', () => {
-    it('should call recordCollectedUsage after successful non-streaming completion', async () => {
-      await createResponse(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        {
-          spendTokens: mockSpendTokens,
-          spendStructuredTokens: mockSpendStructuredTokens,
-          pricing: { getMultiplier: mockGetMultiplier, getCacheMultiplier: mockGetCacheMultiplier },
-          bulkWriteOps: {
-            insertMany: mockBulkInsertTransactions,
-            updateBalance: mockUpdateBalance,
-          },
-        },
-        expect.objectContaining({
-          user: 'user-123',
-          conversationId: expect.any(String),
-          collectedUsage: expect.any(Array),
-          context: 'message',
-        }),
-      );
-    });
-
-    it('should pass balance and transactions config to recordCollectedUsage', async () => {
-      mockGetBalanceConfig.mockReturnValue({ enabled: true, startBalance: 2000 });
-      mockGetTransactionsConfig.mockReturnValue({ enabled: true });
-
-      await createResponse(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          balance: { enabled: true, startBalance: 2000 },
-          transactions: { enabled: true },
-        }),
-      );
-    });
-
-    it('should pass spendTokens, spendStructuredTokens, pricing, and bulkWriteOps as dependencies', async () => {
-      await createResponse(req, res);
-
-      const [deps] = mockRecordCollectedUsage.mock.calls[0];
-      expect(deps).toHaveProperty('spendTokens', mockSpendTokens);
-      expect(deps).toHaveProperty('spendStructuredTokens', mockSpendStructuredTokens);
-      expect(deps).toHaveProperty('pricing');
-      expect(deps.pricing).toHaveProperty('getMultiplier', mockGetMultiplier);
-      expect(deps.pricing).toHaveProperty('getCacheMultiplier', mockGetCacheMultiplier);
-      expect(deps).toHaveProperty('bulkWriteOps');
-      expect(deps.bulkWriteOps).toHaveProperty('insertMany', mockBulkInsertTransactions);
-      expect(deps.bulkWriteOps).toHaveProperty('updateBalance', mockUpdateBalance);
-    });
-
-    it('should include model from primaryConfig in recordCollectedUsage params', async () => {
-      await createResponse(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          model: 'claude-3',
-        }),
-      );
-    });
-  });
-
-  describe('token usage recording - streaming', () => {
-    beforeEach(() => {
-      req.body.stream = true;
-
-      const api = require('@librechat/api');
-      api.validateResponseRequest.mockReturnValue({
-        request: { model: 'agent-123', input: 'Hello', stream: true },
-      });
-    });
-
-    it('should call recordCollectedUsage after successful streaming completion', async () => {
-      await createResponse(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        {
-          spendTokens: mockSpendTokens,
-          spendStructuredTokens: mockSpendStructuredTokens,
-          pricing: { getMultiplier: mockGetMultiplier, getCacheMultiplier: mockGetCacheMultiplier },
-          bulkWriteOps: {
-            insertMany: mockBulkInsertTransactions,
-            updateBalance: mockUpdateBalance,
-          },
-        },
-        expect.objectContaining({
-          user: 'user-123',
-          context: 'message',
-        }),
-      );
-    });
-  });
-
-  describe('collectedUsage population', () => {
-    it('should collect usage from on_chat_model_end events', async () => {
-      const api = require('@librechat/api');
-
-      let capturedOnChatModelEnd;
-      api.createAggregatorEventHandlers.mockImplementation(() => {
-        return {
-          on_message_delta: { handle: jest.fn() },
-          on_reasoning_delta: { handle: jest.fn() },
-          on_run_step: { handle: jest.fn() },
-          on_run_step_delta: { handle: jest.fn() },
-          on_chat_model_end: {
-            handle: jest.fn((event, data) => {
-              if (capturedOnChatModelEnd) {
-                capturedOnChatModelEnd(event, data);
-              }
-            }),
-          },
-        };
-      });
-
-      api.createRun.mockImplementation(async ({ customHandlers }) => {
-        capturedOnChatModelEnd = (event, data) => {
-          customHandlers.on_chat_model_end.handle(event, data);
-        };
-
-        return {
-          processStream: jest.fn().mockImplementation(async () => {
-            customHandlers.on_chat_model_end.handle('on_chat_model_end', {
-              output: {
-                usage_metadata: {
-                  input_tokens: 150,
-                  output_tokens: 75,
-                  model: 'claude-3',
-                },
-              },
-            });
-          }),
-        };
-      });
-
-      await createResponse(req, res);
-
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          collectedUsage: expect.arrayContaining([
-            expect.objectContaining({
-              input_tokens: 150,
-              output_tokens: 75,
-            }),
-          ]),
-        }),
-      );
-    });
-  });
-});
--- a/api/server/controllers/agents/tests/v1.duplicate-actions.spec.js
+++ b/api/server/controllers/agents/tests/v1.duplicate-actions.spec.js
@ -1,159 +0,0 @@
-jest.mock('~/server/services/PermissionService', () => ({
-  findPubliclyAccessibleResources: jest.fn(),
-  findAccessibleResources: jest.fn(),
-  hasPublicPermission: jest.fn(),
-  grantPermission: jest.fn().mockResolvedValue({}),
-}));
-
-jest.mock('~/server/services/Config', () => ({
-  getCachedTools: jest.fn(),
-  getMCPServerTools: jest.fn(),
-}));
-
-const mongoose = require('mongoose');
-const { actionDelimiter } = require('librechat-data-provider');
-const { agentSchema, actionSchema } = require('@librechat/data-schemas');
-const { MongoMemoryServer } = require('mongodb-memory-server');
-const { duplicateAgent } = require('../v1');
-
-let mongoServer;
-
-beforeAll(async () => {
-  mongoServer = await MongoMemoryServer.create();
-  const mongoUri = mongoServer.getUri();
-  if (!mongoose.models.Agent) {
-    mongoose.model('Agent', agentSchema);
-  }
-  if (!mongoose.models.Action) {
-    mongoose.model('Action', actionSchema);
-  }
-  await mongoose.connect(mongoUri);
-}, 20000);
-
-afterAll(async () => {
-  await mongoose.disconnect();
-  await mongoServer.stop();
-});
-
-beforeEach(async () => {
-  await mongoose.models.Agent.deleteMany({});
-  await mongoose.models.Action.deleteMany({});
-});
-
-describe('duplicateAgentHandler — action domain extraction', () => {
-  it('builds duplicated action entries using metadata.domain, not action_id', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const originalAgentId = `agent_original`;
-
-    const agent = await mongoose.models.Agent.create({
-      id: originalAgentId,
-      name: 'Test Agent',
-      author: userId.toString(),
-      provider: 'openai',
-      model: 'gpt-4',
-      tools: [],
-      actions: [`api.example.com${actionDelimiter}act_original`],
-      versions: [{ name: 'Test Agent', createdAt: new Date(), updatedAt: new Date() }],
-    });
-
-    await mongoose.models.Action.create({
-      user: userId,
-      action_id: 'act_original',
-      agent_id: originalAgentId,
-      metadata: { domain: 'api.example.com' },
-    });
-
-    const req = {
-      params: { id: agent.id },
-      user: { id: userId.toString() },
-    };
-    const res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-    };
-
-    await duplicateAgent(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(201);
-
-    const { agent: newAgent, actions: newActions } = res.json.mock.calls[0][0];
-
-    expect(newAgent.id).not.toBe(originalAgentId);
-    expect(String(newAgent.author)).toBe(userId.toString());
-    expect(newActions).toHaveLength(1);
-    expect(newActions[0].metadata.domain).toBe('api.example.com');
-    expect(newActions[0].agent_id).toBe(newAgent.id);
-
-    for (const actionEntry of newAgent.actions) {
-      const [domain, actionId] = actionEntry.split(actionDelimiter);
-      expect(domain).toBe('api.example.com');
-      expect(actionId).toBeTruthy();
-      expect(actionId).not.toBe('act_original');
-    }
-
-    const allActions = await mongoose.models.Action.find({}).lean();
-    expect(allActions).toHaveLength(2);
-
-    const originalAction = allActions.find((a) => a.action_id === 'act_original');
-    expect(originalAction.agent_id).toBe(originalAgentId);
-
-    const duplicatedAction = allActions.find((a) => a.action_id !== 'act_original');
-    expect(duplicatedAction.agent_id).toBe(newAgent.id);
-    expect(duplicatedAction.metadata.domain).toBe('api.example.com');
-  });
-
-  it('strips sensitive metadata fields from duplicated actions', async () => {
-    const userId = new mongoose.Types.ObjectId();
-    const originalAgentId = 'agent_sensitive';
-
-    await mongoose.models.Agent.create({
-      id: originalAgentId,
-      name: 'Sensitive Agent',
-      author: userId.toString(),
-      provider: 'openai',
-      model: 'gpt-4',
-      tools: [],
-      actions: [`secure.api.com${actionDelimiter}act_secret`],
-      versions: [{ name: 'Sensitive Agent', createdAt: new Date(), updatedAt: new Date() }],
-    });
-
-    await mongoose.models.Action.create({
-      user: userId,
-      action_id: 'act_secret',
-      agent_id: originalAgentId,
-      metadata: {
-        domain: 'secure.api.com',
-        api_key: 'sk-secret-key-12345',
-        oauth_client_id: 'client_id_xyz',
-        oauth_client_secret: 'client_secret_xyz',
-      },
-    });
-
-    const req = {
-      params: { id: originalAgentId },
-      user: { id: userId.toString() },
-    };
-    const res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-    };
-
-    await duplicateAgent(req, res);
-
-    expect(res.status).toHaveBeenCalledWith(201);
-
-    const duplicatedAction = await mongoose.models.Action.findOne({
-      agent_id: { $ne: originalAgentId },
-    }).lean();
-
-    expect(duplicatedAction.metadata.domain).toBe('secure.api.com');
-    expect(duplicatedAction.metadata.api_key).toBeUndefined();
-    expect(duplicatedAction.metadata.oauth_client_id).toBeUndefined();
-    expect(duplicatedAction.metadata.oauth_client_secret).toBeUndefined();
-
-    const originalAction = await mongoose.models.Action.findOne({
-      action_id: 'act_secret',
-    }).lean();
-    expect(originalAction.metadata.api_key).toBe('sk-secret-key-12345');
-  });
-});
--- a/api/server/controllers/agents/callbacks.js
+++ b/api/server/controllers/agents/callbacks.js
@ -1,13 +1,16 @@
 const { nanoid } = require('nanoid');
+const { sendEvent, GenerationJobManager } = require('@librechat/api');
 const { logger } = require('@librechat/data-schemas');
-const { Constants, EnvVar, GraphEvents, ToolEndHandler } = require('@librechat/agents');
 const { Tools, StepTypes, FileContext, ErrorTypes } = require('librechat-data-provider');
 const {
-  sendEvent,
-  GenerationJobManager,
-  writeAttachmentEvent,
-  createToolExecuteHandler,
-} = require('@librechat/api');
+  EnvVar,
+  Providers,
+  GraphEvents,
+  getMessageId,
+  ToolEndHandler,
+  handleToolCalls,
+  ChatModelStreamHandler,
+} = require('@librechat/agents');
 const { processFileCitations } = require('~/server/services/Files/Citations');
 const { processCodeOutput } = require('~/server/services/Files/Code/process');
 const { loadAuthValues } = require('~/server/services/Tools/credentials');
@ -48,6 +51,8 @@ class ModelEndHandler {
    let errorMessage;
    try {
      const agentContext = graph.getAgentContext(metadata);
+      const isGoogle = agentContext.provider === Providers.GOOGLE;
+      const streamingDisabled = !!agentContext.clientOptions?.disableStreaming;
      if (data?.output?.additional_kwargs?.stop_reason === 'refusal') {
        const info = { ...data.output.additional_kwargs };
        errorMessage = JSON.stringify({
@ -62,6 +67,21 @@ class ModelEndHandler {
        });
      }

+      const toolCalls = data?.output?.tool_calls;
+      let hasUnprocessedToolCalls = false;
+      if (Array.isArray(toolCalls) && toolCalls.length > 0 && graph?.toolCallStepIds?.has) {
+        try {
+          hasUnprocessedToolCalls = toolCalls.some(
+            (tc) => tc?.id && !graph.toolCallStepIds.has(tc.id),
+          );
+        } catch {
+          hasUnprocessedToolCalls = false;
+        }
+      }
+      if (isGoogle || streamingDisabled || hasUnprocessedToolCalls) {
+        await handleToolCalls(toolCalls, metadata, graph);
+      }
+
      const usage = data?.output?.usage_metadata;
      if (!usage) {
        return this.finalize(errorMessage);
@ -72,6 +92,38 @@ class ModelEndHandler {
      }

      this.collectedUsage.push(usage);
+      if (!streamingDisabled) {
+        return this.finalize(errorMessage);
+      }
+      if (!data.output.content) {
+        return this.finalize(errorMessage);
+      }
+      const stepKey = graph.getStepKey(metadata);
+      const message_id = getMessageId(stepKey, graph) ?? '';
+      if (message_id) {
+        await graph.dispatchRunStep(stepKey, {
+          type: StepTypes.MESSAGE_CREATION,
+          message_creation: {
+            message_id,
+          },
+        });
+      }
+      const stepId = graph.getStepIdByKey(stepKey);
+      const content = data.output.content;
+      if (typeof content === 'string') {
+        await graph.dispatchMessageDelta(stepId, {
+          content: [
+            {
+              type: 'text',
+              text: content,
+            },
+          ],
+        });
+      } else if (content.every((c) => c.type?.startsWith('text'))) {
+        await graph.dispatchMessageDelta(stepId, {
+          content,
+        });
+      }
    } catch (error) {
      logger.error('Error handling model end event:', error);
      return this.finalize(errorMessage);
@ -94,26 +146,18 @@ function checkIfLastAgent(last_agent_id, langgraph_node) {

 /**
 * Helper to emit events either to res (standard mode) or to job emitter (resumable mode).
- * In Redis mode, awaits the emit to guarantee event ordering (critical for streaming deltas).
 * @param {ServerResponse} res - The server response object
 * @param {string | null} streamId - The stream ID for resumable mode, or null for standard mode
 * @param {Object} eventData - The event data to send
- * @returns {Promise<void>}
 */
-async function emitEvent(res, streamId, eventData) {
+function emitEvent(res, streamId, eventData) {
  if (streamId) {
-    await GenerationJobManager.emitChunk(streamId, eventData);
+    GenerationJobManager.emitChunk(streamId, eventData);
  } else {
    sendEvent(res, eventData);
  }
 }

-/**
- * @typedef {Object} ToolExecuteOptions
- * @property {(toolNames: string[]) => Promise<{loadedTools: StructuredTool[]}>} loadTools - Function to load tools by name
- * @property {Object} configurable - Configurable context for tool invocation
- */
-
 /**
 * Get default handlers for stream events.
 * @param {Object} options - The options object.
@ -122,7 +166,6 @@ async function emitEvent(res, streamId, eventData) {
 * @param {ToolEndCallback} options.toolEndCallback - Callback to use when tool ends.
 * @param {Array<UsageMetadata>} options.collectedUsage - The list of collected usage metadata.
 * @param {string | null} [options.streamId] - The stream ID for resumable mode, or null for standard mode.
- * @param {ToolExecuteOptions} [options.toolExecuteOptions] - Options for event-driven tool execution.
 * @returns {Record<string, t.EventHandler>} The default handlers.
 * @throws {Error} If the request is not found.
 */
@ -132,7 +175,6 @@ function getDefaultHandlers({
  toolEndCallback,
  collectedUsage,
  streamId = null,
-  toolExecuteOptions = null,
 }) {
  if (!res || !aggregateContent) {
    throw new Error(
@ -142,6 +184,7 @@ function getDefaultHandlers({
  const handlers = {
    [GraphEvents.CHAT_MODEL_END]: new ModelEndHandler(collectedUsage),
    [GraphEvents.TOOL_END]: new ToolEndHandler(toolEndCallback, logger),
+    [GraphEvents.CHAT_MODEL_STREAM]: new ChatModelStreamHandler(),
    [GraphEvents.ON_RUN_STEP]: {
      /**
       * Handle ON_RUN_STEP event.
@ -149,19 +192,18 @@ function getDefaultHandlers({
       * @param {StreamEventData} data - The event data.
       * @param {GraphRunnableConfig['configurable']} [metadata] The runnable metadata.
       */
-      handle: async (event, data, metadata) => {
-        aggregateContent({ event, data });
+      handle: (event, data, metadata) => {
        if (data?.stepDetails.type === StepTypes.TOOL_CALLS) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (checkIfLastAgent(metadata?.last_agent_id, metadata?.langgraph_node)) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (!metadata?.hide_sequential_outputs) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else {
          const agentName = metadata?.name ?? 'Agent';
          const isToolCall = data?.stepDetails.type === StepTypes.TOOL_CALLS;
          const action = isToolCall ? 'performing a task...' : 'thinking...';
-          await emitEvent(res, streamId, {
+          emitEvent(res, streamId, {
            event: 'on_agent_update',
            data: {
              runId: metadata?.run_id,
@ -169,6 +211,7 @@ function getDefaultHandlers({
            },
          });
        }
+        aggregateContent({ event, data });
      },
    },
    [GraphEvents.ON_RUN_STEP_DELTA]: {
@ -178,15 +221,15 @@ function getDefaultHandlers({
       * @param {StreamEventData} data - The event data.
       * @param {GraphRunnableConfig['configurable']} [metadata] The runnable metadata.
       */
-      handle: async (event, data, metadata) => {
-        aggregateContent({ event, data });
+      handle: (event, data, metadata) => {
        if (data?.delta.type === StepTypes.TOOL_CALLS) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (checkIfLastAgent(metadata?.last_agent_id, metadata?.langgraph_node)) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (!metadata?.hide_sequential_outputs) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        }
+        aggregateContent({ event, data });
      },
    },
    [GraphEvents.ON_RUN_STEP_COMPLETED]: {
@ -196,15 +239,15 @@ function getDefaultHandlers({
       * @param {StreamEventData & { result: ToolEndData }} data - The event data.
       * @param {GraphRunnableConfig['configurable']} [metadata] The runnable metadata.
       */
-      handle: async (event, data, metadata) => {
-        aggregateContent({ event, data });
+      handle: (event, data, metadata) => {
        if (data?.result != null) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (checkIfLastAgent(metadata?.last_agent_id, metadata?.langgraph_node)) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (!metadata?.hide_sequential_outputs) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        }
+        aggregateContent({ event, data });
      },
    },
    [GraphEvents.ON_MESSAGE_DELTA]: {
@ -214,13 +257,13 @@ function getDefaultHandlers({
       * @param {StreamEventData} data - The event data.
       * @param {GraphRunnableConfig['configurable']} [metadata] The runnable metadata.
       */
-      handle: async (event, data, metadata) => {
-        aggregateContent({ event, data });
+      handle: (event, data, metadata) => {
        if (checkIfLastAgent(metadata?.last_agent_id, metadata?.langgraph_node)) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (!metadata?.hide_sequential_outputs) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        }
+        aggregateContent({ event, data });
      },
    },
    [GraphEvents.ON_REASONING_DELTA]: {
@ -230,27 +273,22 @@ function getDefaultHandlers({
       * @param {StreamEventData} data - The event data.
       * @param {GraphRunnableConfig['configurable']} [metadata] The runnable metadata.
       */
-      handle: async (event, data, metadata) => {
-        aggregateContent({ event, data });
+      handle: (event, data, metadata) => {
        if (checkIfLastAgent(metadata?.last_agent_id, metadata?.langgraph_node)) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        } else if (!metadata?.hide_sequential_outputs) {
-          await emitEvent(res, streamId, { event, data });
+          emitEvent(res, streamId, { event, data });
        }
+        aggregateContent({ event, data });
      },
    },
  };

-  if (toolExecuteOptions) {
-    handlers[GraphEvents.ON_TOOL_EXECUTE] = createToolExecuteHandler(toolExecuteOptions);
-  }
-
  return handlers;
 }

 /**
 * Helper to write attachment events either to res or to job emitter.
- * Note: Attachments are not order-sensitive like deltas, so fire-and-forget is acceptable.
 * @param {ServerResponse} res - The server response object
 * @param {string | null} streamId - The stream ID for resumable mode, or null for standard mode
 * @param {Object} attachment - The attachment data
@ -403,10 +441,10 @@ function createToolEndCallback({ req, res, artifactPromises, streamId = null })
      return;
    }

-    const isCodeTool =
-      output.name === Tools.execute_code || output.name === Constants.PROGRAMMATIC_TOOL_CALLING;
-    if (!isCodeTool) {
-      return;
+    {
+      if (output.name !== Tools.execute_code) {
+        return;
+      }
    }

    if (!output.artifact.files) {
@ -450,226 +488,7 @@ function createToolEndCallback({ req, res, artifactPromises, streamId = null })
  };
 }

-/**
- * Helper to write attachment events in Open Responses format (librechat:attachment)
- * @param {ServerResponse} res - The server response object
- * @param {Object} tracker - The response tracker with sequence number
- * @param {Object} attachment - The attachment data
- * @param {Object} metadata - Additional metadata (messageId, conversationId)
- */
-function writeResponsesAttachment(res, tracker, attachment, metadata) {
-  const sequenceNumber = tracker.nextSequence();
-  writeAttachmentEvent(res, sequenceNumber, attachment, {
-    messageId: metadata.run_id,
-    conversationId: metadata.thread_id,
-  });
-}
-
-/**
- * Creates a tool end callback specifically for the Responses API.
- * Emits attachments as `librechat:attachment` events per the Open Responses extension spec.
- *
- * @param {Object} params
- * @param {ServerRequest} params.req
- * @param {ServerResponse} params.res
- * @param {Object} params.tracker - Response tracker with sequence number
- * @param {Promise<MongoFile | { filename: string; filepath: string; expires: number;} | null>[]} params.artifactPromises
- * @returns {ToolEndCallback} The tool end callback.
- */
-function createResponsesToolEndCallback({ req, res, tracker, artifactPromises }) {
-  /**
-   * @type {ToolEndCallback}
-   */
-  return async (data, metadata) => {
-    const output = data?.output;
-    if (!output) {
-      return;
-    }
-
-    if (!output.artifact) {
-      return;
-    }
-
-    if (output.artifact[Tools.file_search]) {
-      artifactPromises.push(
-        (async () => {
-          const user = req.user;
-          const attachment = await processFileCitations({
-            user,
-            metadata,
-            appConfig: req.config,
-            toolArtifact: output.artifact,
-            toolCallId: output.tool_call_id,
-          });
-          if (!attachment) {
-            return null;
-          }
-          // For Responses API, emit attachment during streaming
-          if (res.headersSent && !res.writableEnded) {
-            writeResponsesAttachment(res, tracker, attachment, metadata);
-          }
-          return attachment;
-        })().catch((error) => {
-          logger.error('Error processing file citations:', error);
-          return null;
-        }),
-      );
-    }
-
-    if (output.artifact[Tools.ui_resources]) {
-      artifactPromises.push(
-        (async () => {
-          const attachment = {
-            type: Tools.ui_resources,
-            toolCallId: output.tool_call_id,
-            [Tools.ui_resources]: output.artifact[Tools.ui_resources].data,
-          };
-          // For Responses API, always emit attachment during streaming
-          if (res.headersSent && !res.writableEnded) {
-            writeResponsesAttachment(res, tracker, attachment, metadata);
-          }
-          return attachment;
-        })().catch((error) => {
-          logger.error('Error processing artifact content:', error);
-          return null;
-        }),
-      );
-    }
-
-    if (output.artifact[Tools.web_search]) {
-      artifactPromises.push(
-        (async () => {
-          const attachment = {
-            type: Tools.web_search,
-            toolCallId: output.tool_call_id,
-            [Tools.web_search]: { ...output.artifact[Tools.web_search] },
-          };
-          // For Responses API, always emit attachment during streaming
-          if (res.headersSent && !res.writableEnded) {
-            writeResponsesAttachment(res, tracker, attachment, metadata);
-          }
-          return attachment;
-        })().catch((error) => {
-          logger.error('Error processing artifact content:', error);
-          return null;
-        }),
-      );
-    }
-
-    if (output.artifact.content) {
-      /** @type {FormattedContent[]} */
-      const content = output.artifact.content;
-      for (let i = 0; i < content.length; i++) {
-        const part = content[i];
-        if (!part) {
-          continue;
-        }
-        if (part.type !== 'image_url') {
-          continue;
-        }
-        const { url } = part.image_url;
-        artifactPromises.push(
-          (async () => {
-            const filename = `${output.name}_img_${nanoid()}`;
-            const file_id = output.artifact.file_ids?.[i];
-            const file = await saveBase64Image(url, {
-              req,
-              file_id,
-              filename,
-              endpoint: metadata.provider,
-              context: FileContext.image_generation,
-            });
-            const fileMetadata = Object.assign(file, {
-              toolCallId: output.tool_call_id,
-            });
-
-            if (!fileMetadata) {
-              return null;
-            }
-
-            // For Responses API, emit attachment during streaming
-            if (res.headersSent && !res.writableEnded) {
-              const attachment = {
-                file_id: fileMetadata.file_id,
-                filename: fileMetadata.filename,
-                type: fileMetadata.type,
-                url: fileMetadata.filepath,
-                width: fileMetadata.width,
-                height: fileMetadata.height,
-                tool_call_id: output.tool_call_id,
-              };
-              writeResponsesAttachment(res, tracker, attachment, metadata);
-            }
-
-            return fileMetadata;
-          })().catch((error) => {
-            logger.error('Error processing artifact content:', error);
-            return null;
-          }),
-        );
-      }
-      return;
-    }
-
-    const isCodeTool =
-      output.name === Tools.execute_code || output.name === Constants.PROGRAMMATIC_TOOL_CALLING;
-    if (!isCodeTool) {
-      return;
-    }
-
-    if (!output.artifact.files) {
-      return;
-    }
-
-    for (const file of output.artifact.files) {
-      const { id, name } = file;
-      artifactPromises.push(
-        (async () => {
-          const result = await loadAuthValues({
-            userId: req.user.id,
-            authFields: [EnvVar.CODE_API_KEY],
-          });
-          const fileMetadata = await processCodeOutput({
-            req,
-            id,
-            name,
-            apiKey: result[EnvVar.CODE_API_KEY],
-            messageId: metadata.run_id,
-            toolCallId: output.tool_call_id,
-            conversationId: metadata.thread_id,
-            session_id: output.artifact.session_id,
-          });
-
-          if (!fileMetadata) {
-            return null;
-          }
-
-          // For Responses API, emit attachment during streaming
-          if (res.headersSent && !res.writableEnded) {
-            const attachment = {
-              file_id: fileMetadata.file_id,
-              filename: fileMetadata.filename,
-              type: fileMetadata.type,
-              url: fileMetadata.filepath,
-              width: fileMetadata.width,
-              height: fileMetadata.height,
-              tool_call_id: output.tool_call_id,
-            };
-            writeResponsesAttachment(res, tracker, attachment, metadata);
-          }
-
-          return fileMetadata;
-        })().catch((error) => {
-          logger.error('Error processing code output:', error);
-          return null;
-        }),
-      );
-    }
-  };
-}
-
 module.exports = {
  getDefaultHandlers,
  createToolEndCallback,
-  createResponsesToolEndCallback,
 };
--- a/api/server/controllers/agents/client.js
+++ b/api/server/controllers/agents/client.js
@ -5,24 +5,18 @@ const {
  createRun,
  Tokenizer,
  checkAccess,
-  buildToolSet,
+  logAxiosError,
  sanitizeTitle,
-  logToolError,
-  payloadParser,
  resolveHeaders,
  createSafeUser,
  initializeAgent,
  getBalanceConfig,
-  omitTitleOptions,
  getProviderConfig,
  memoryInstructions,
-  createTokenCounter,
  applyContextToAgent,
-  recordCollectedUsage,
  GenerationJobManager,
  getTransactionsConfig,
  createMemoryProcessor,
-  createMultiAgentMapper,
  filterMalformedContentParts,
 } = require('@librechat/api');
 const {
@ -30,7 +24,9 @@ const {
  Providers,
  TitleMethod,
  formatMessage,
+  labelContentByAgent,
  formatAgentMessages,
+  getTokenCountForMessage,
  createMetadataAggregator,
 } = require('@librechat/agents');
 const {
@ -42,13 +38,11 @@ const {
  PermissionTypes,
  isAgentsEndpoint,
  isEphemeralAgentId,
+  bedrockInputSchema,
  removeNullishValues,
 } = require('librechat-data-provider');
-const { filterFilesByAgentAccess } = require('~/server/services/Files/permissions');
 const { spendTokens, spendStructuredTokens } = require('~/models/spendTokens');
 const { encodeAndFormat } = require('~/server/services/Files/images/encode');
-const { updateBalance, bulkInsertTransactions } = require('~/models');
-const { getMultiplier, getCacheMultiplier } = require('~/models/tx');
 const { createContextHandlers } = require('~/app/clients/prompts');
 const { getConvoFiles } = require('~/models/Conversation');
 const BaseClient = require('~/app/clients/BaseClient');
@ -57,6 +51,183 @@ const { loadAgent } = require('~/models/Agent');
 const { getMCPManager } = require('~/config');
 const db = require('~/models');

+const omitTitleOptions = new Set([
+  'stream',
+  'thinking',
+  'streaming',
+  'clientOptions',
+  'thinkingConfig',
+  'thinkingBudget',
+  'includeThoughts',
+  'maxOutputTokens',
+  'additionalModelRequestFields',
+]);
+
+/**
+ * @param {ServerRequest} req
+ * @param {Agent} agent
+ * @param {string} endpoint
+ */
+const payloadParser = ({ req, agent, endpoint }) => {
+  if (isAgentsEndpoint(endpoint)) {
+    return { model: undefined };
+  } else if (endpoint === EModelEndpoint.bedrock) {
+    const parsedValues = bedrockInputSchema.parse(agent.model_parameters);
+    if (parsedValues.thinking == null) {
+      parsedValues.thinking = false;
+    }
+    return parsedValues;
+  }
+  return req.body.endpointOption.model_parameters;
+};
+
+function createTokenCounter(encoding) {
+  return function (message) {
+    const countTokens = (text) => Tokenizer.getTokenCount(text, encoding);
+    return getTokenCountForMessage(message, countTokens);
+  };
+}
+
+function logToolError(graph, error, toolId) {
+  logAxiosError({
+    error,
+    message: `[api/server/controllers/agents/client.js #chatCompletion] Tool Error "${toolId}"`,
+  });
+}
+
+/** Regex pattern to match agent ID suffix (____N) */
+const AGENT_SUFFIX_PATTERN = /____(\d+)$/;
+
+/**
+ * Finds the primary agent ID within a set of agent IDs.
+ * Primary = no suffix (____N) or lowest suffix number.
+ * @param {Set<string>} agentIds
+ * @returns {string | null}
+ */
+function findPrimaryAgentId(agentIds) {
+  let primaryAgentId = null;
+  let lowestSuffixIndex = Infinity;
+
+  for (const agentId of agentIds) {
+    const suffixMatch = agentId.match(AGENT_SUFFIX_PATTERN);
+    if (!suffixMatch) {
+      return agentId;
+    }
+    const suffixIndex = parseInt(suffixMatch[1], 10);
+    if (suffixIndex < lowestSuffixIndex) {
+      lowestSuffixIndex = suffixIndex;
+      primaryAgentId = agentId;
+    }
+  }
+
+  return primaryAgentId;
+}
+
+/**
+ * Creates a mapMethod for getMessagesForConversation that processes agent content.
+ * - Strips agentId/groupId metadata from all content
+ * - For parallel agents (addedConvo with groupId): filters each group to its primary agent
+ * - For handoffs (agentId without groupId): keeps all content from all agents
+ * - For multi-agent: applies agent labels to content
+ *
+ * The key distinction:
+ * - Parallel execution (addedConvo): Parts have both agentId AND groupId
+ * - Handoffs: Parts only have agentId, no groupId
+ *
+ * @param {Agent} primaryAgent - Primary agent configuration
+ * @param {Map<string, Agent>} [agentConfigs] - Additional agent configurations
+ * @returns {(message: TMessage) => TMessage} Map method for processing messages
+ */
+function createMultiAgentMapper(primaryAgent, agentConfigs) {
+  const hasMultipleAgents = (primaryAgent.edges?.length ?? 0) > 0 || (agentConfigs?.size ?? 0) > 0;
+
+  /** @type {Record<string, string> | null} */
+  let agentNames = null;
+  if (hasMultipleAgents) {
+    agentNames = { [primaryAgent.id]: primaryAgent.name || 'Assistant' };
+    if (agentConfigs) {
+      for (const [agentId, agentConfig] of agentConfigs.entries()) {
+        agentNames[agentId] = agentConfig.name || agentConfig.id;
+      }
+    }
+  }
+
+  return (message) => {
+    if (message.isCreatedByUser || !Array.isArray(message.content)) {
+      return message;
+    }
+
+    // Check for metadata
+    const hasAgentMetadata = message.content.some((part) => part?.agentId || part?.groupId != null);
+    if (!hasAgentMetadata) {
+      return message;
+    }
+
+    try {
+      // Build a map of groupId -> Set of agentIds, to find primary per group
+      /** @type {Map<number, Set<string>>} */
+      const groupAgentMap = new Map();
+
+      for (const part of message.content) {
+        const groupId = part?.groupId;
+        const agentId = part?.agentId;
+        if (groupId != null && agentId) {
+          if (!groupAgentMap.has(groupId)) {
+            groupAgentMap.set(groupId, new Set());
+          }
+          groupAgentMap.get(groupId).add(agentId);
+        }
+      }
+
+      // For each group, find the primary agent
+      /** @type {Map<number, string>} */
+      const groupPrimaryMap = new Map();
+      for (const [groupId, agentIds] of groupAgentMap) {
+        const primary = findPrimaryAgentId(agentIds);
+        if (primary) {
+          groupPrimaryMap.set(groupId, primary);
+        }
+      }
+
+      /** @type {Array<TMessageContentParts>} */
+      const filteredContent = [];
+      /** @type {Record<number, string>} */
+      const agentIdMap = {};
+
+      for (const part of message.content) {
+        const agentId = part?.agentId;
+        const groupId = part?.groupId;
+
+        // Filtering logic:
+        // - No groupId (handoffs): always include
+        // - Has groupId (parallel): only include if it's the primary for that group
+        const isParallelPart = groupId != null;
+        const groupPrimary = isParallelPart ? groupPrimaryMap.get(groupId) : null;
+        const shouldInclude = !isParallelPart || !agentId || agentId === groupPrimary;
+
+        if (shouldInclude) {
+          const newIndex = filteredContent.length;
+          const { agentId: _a, groupId: _g, ...cleanPart } = part;
+          filteredContent.push(cleanPart);
+          if (agentId && hasMultipleAgents) {
+            agentIdMap[newIndex] = agentId;
+          }
+        }
+      }
+
+      const finalContent =
+        Object.keys(agentIdMap).length > 0 && agentNames
+          ? labelContentByAgent(filteredContent, agentIdMap, agentNames)
+          : filteredContent;
+
+      return { ...message, content: finalContent };
+    } catch (error) {
+      logger.error('[AgentClient] Error processing multi-agent message:', error);
+      return message;
+    }
+  };
+}
+
 class AgentClient extends BaseClient {
  constructor(options = {}) {
    super(null, options);
@ -124,9 +295,14 @@ class AgentClient extends BaseClient {
  checkVisionRequest() {}

  getSaveOptions() {
+    // TODO:
+    // would need to be override settings; otherwise, model needs to be undefined
+    // model: this.override.model,
+    // instructions: this.override.instructions,
+    // additional_instructions: this.override.additional_instructions,
    let runOptions = {};
    try {
-      runOptions = payloadParser(this.options) ?? {};
+      runOptions = payloadParser(this.options);
    } catch (error) {
      logger.error(
        '[api/server/controllers/agents/client.js #getSaveOptions] Error parsing options',
@ -137,14 +313,14 @@ class AgentClient extends BaseClient {
    return removeNullishValues(
      Object.assign(
        {
-          spec: this.options.spec,
-          iconURL: this.options.iconURL,
          endpoint: this.options.endpoint,
          agent_id: this.options.agent.id,
          modelLabel: this.options.modelLabel,
+          maxContextTokens: this.options.maxContextTokens,
          resendFiles: this.options.resendFiles,
          imageDetail: this.options.imageDetail,
-          maxContextTokens: this.maxContextTokens,
+          spec: this.options.spec,
+          iconURL: this.options.iconURL,
        },
        // TODO: PARSE OPTIONS BY PROVIDER, MAY CONTAIN SENSITIVE DATA
        runOptions,
@ -479,8 +655,6 @@ class AgentClient extends BaseClient {
        updateFilesUsage: db.updateFilesUsage,
        getUserKeyValues: db.getUserKeyValues,
        getToolFilesByIds: db.getToolFilesByIds,
-        getCodeGeneratedFiles: db.getCodeGeneratedFiles,
-        filterFilesByAgentAccess,
      },
    );

@ -629,29 +803,82 @@ class AgentClient extends BaseClient {
    context = 'message',
    collectedUsage = this.collectedUsage,
  }) {
-    const result = await recordCollectedUsage(
-      {
-        spendTokens,
-        spendStructuredTokens,
-        pricing: { getMultiplier, getCacheMultiplier },
-        bulkWriteOps: { insertMany: bulkInsertTransactions, updateBalance },
-      },
-      {
-        user: this.user ?? this.options.req.user?.id,
-        conversationId: this.conversationId,
-        collectedUsage,
-        model: model ?? this.model ?? this.options.agent.model_parameters.model,
+    if (!collectedUsage || !collectedUsage.length) {
+      return;
+    }
+    // Use first entry's input_tokens as the base input (represents initial user message context)
+    // Support both OpenAI format (input_token_details) and Anthropic format (cache_*_input_tokens)
+    const firstUsage = collectedUsage[0];
+    const input_tokens =
+      (firstUsage?.input_tokens || 0) +
+      (Number(firstUsage?.input_token_details?.cache_creation) ||
+        Number(firstUsage?.cache_creation_input_tokens) ||
+        0) +
+      (Number(firstUsage?.input_token_details?.cache_read) ||
+        Number(firstUsage?.cache_read_input_tokens) ||
+        0);
+
+    // Sum output_tokens directly from all entries - works for both sequential and parallel execution
+    // This avoids the incremental calculation that produced negative values for parallel agents
+    let total_output_tokens = 0;
+
+    for (const usage of collectedUsage) {
+      if (!usage) {
+        continue;
+      }
+
+      // Support both OpenAI format (input_token_details) and Anthropic format (cache_*_input_tokens)
+      const cache_creation =
+        Number(usage.input_token_details?.cache_creation) ||
+        Number(usage.cache_creation_input_tokens) ||
+        0;
+      const cache_read =
+        Number(usage.input_token_details?.cache_read) || Number(usage.cache_read_input_tokens) || 0;
+
+      // Accumulate output tokens for the usage summary
+      total_output_tokens += Number(usage.output_tokens) || 0;
+
+      const txMetadata = {
        context,
-        messageId: this.responseMessageId,
        balance,
        transactions,
+        conversationId: this.conversationId,
+        user: this.user ?? this.options.req.user?.id,
        endpointTokenConfig: this.options.endpointTokenConfig,
-      },
-    );
+        model: usage.model ?? model ?? this.model ?? this.options.agent.model_parameters.model,
+      };

-    if (result) {
-      this.usage = result;
+      if (cache_creation > 0 || cache_read > 0) {
+        spendStructuredTokens(txMetadata, {
+          promptTokens: {
+            input: usage.input_tokens,
+            write: cache_creation,
+            read: cache_read,
+          },
+          completionTokens: usage.output_tokens,
+        }).catch((err) => {
+          logger.error(
+            '[api/server/controllers/agents/client.js #recordCollectedUsage] Error spending structured tokens',
+            err,
+          );
+        });
+        continue;
+      }
+      spendTokens(txMetadata, {
+        promptTokens: usage.input_tokens,
+        completionTokens: usage.output_tokens,
+      }).catch((err) => {
+        logger.error(
+          '[api/server/controllers/agents/client.js #recordCollectedUsage] Error spending tokens',
+          err,
+        );
+      });
    }
+
+    this.usage = {
+      input_tokens,
+      output_tokens: total_output_tokens,
+    };
  }

  /**
@ -740,13 +967,13 @@ class AgentClient extends BaseClient {
          },
          user: createSafeUser(this.options.req.user),
        },
-        recursionLimit: agentsEConfig?.recursionLimit ?? 50,
+        recursionLimit: agentsEConfig?.recursionLimit ?? 25,
        signal: abortController.signal,
        streamMode: 'values',
        version: 'v2',
      };

-      const toolSet = buildToolSet(this.options.agent);
+      const toolSet = new Set((this.options.agent.tools ?? []).map((tool) => tool && tool.name));
      let { messages: initialMessages, indexTokenCountMap } = formatAgentMessages(
        payload,
        this.indexTokenCountMap,
@ -807,7 +1034,6 @@ class AgentClient extends BaseClient {

        run = await createRun({
          agents,
-          messages,
          indexTokenCountMap,
          runId: this.responseMessageId,
          signal: abortController.signal,
@ -843,10 +1069,9 @@ class AgentClient extends BaseClient {
        config.signal = null;
      };

-      const hideSequentialOutputs = config.configurable.hide_sequential_outputs;
      await runAgents(initialMessages);
      /** @deprecated Agent Chain */
-      if (hideSequentialOutputs) {
+      if (config.configurable.hide_sequential_outputs) {
        this.contentParts = this.contentParts.filter((part, index) => {
          // Include parts that are either:
          // 1. At or after the finalContentStart index
@ -1100,7 +1325,6 @@ class AgentClient extends BaseClient {
        model: clientOptions.model,
        balance: balanceConfig,
        transactions: transactionsConfig,
-        messageId: this.responseMessageId,
      }).catch((err) => {
        logger.error(
          '[api/server/controllers/agents/client.js #titleConvo] Error recording collected usage',
@ -1139,7 +1363,6 @@ class AgentClient extends BaseClient {
          model,
          context,
          balance,
-          messageId: this.responseMessageId,
          conversationId: this.conversationId,
          user: this.user ?? this.options.req.user?.id,
          endpointTokenConfig: this.options.endpointTokenConfig,
@ -1158,7 +1381,6 @@ class AgentClient extends BaseClient {
            model,
            balance,
            context: 'reasoning',
-            messageId: this.responseMessageId,
            conversationId: this.conversationId,
            user: this.user ?? this.options.req.user?.id,
            endpointTokenConfig: this.options.endpointTokenConfig,
@ -1174,11 +1396,7 @@ class AgentClient extends BaseClient {
    }
  }

-  /** Anthropic Claude models use a distinct BPE tokenizer; all others default to o200k_base. */
  getEncoding() {
-    if (this.model && this.model.toLowerCase().includes('claude')) {
-      return 'claude';
-    }
    return 'o200k_base';
  }

--- a/api/server/controllers/agents/client.test.js
+++ b/api/server/controllers/agents/client.test.js
@ -263,7 +263,6 @@ describe('AgentClient - titleConvo', () => {
        transactions: {
          enabled: true,
        },
-        messageId: 'response-123',
      });
    });

--- a/api/server/controllers/agents/filterAuthorizedTools.spec.js
+++ b/api/server/controllers/agents/filterAuthorizedTools.spec.js
@ -1,677 +0,0 @@
-const mongoose = require('mongoose');
-const { v4: uuidv4 } = require('uuid');
-const { Constants } = require('librechat-data-provider');
-const { agentSchema } = require('@librechat/data-schemas');
-const { MongoMemoryServer } = require('mongodb-memory-server');
-
-const d = Constants.mcp_delimiter;
-
-const mockGetAllServerConfigs = jest.fn();
-
-jest.mock('~/server/services/Config', () => ({
-  getCachedTools: jest.fn().mockResolvedValue({
-    web_search: true,
-    execute_code: true,
-    file_search: true,
-  }),
-}));
-
-jest.mock('~/config', () => ({
-  getMCPServersRegistry: jest.fn(() => ({
-    getAllServerConfigs: mockGetAllServerConfigs,
-  })),
-}));
-
-jest.mock('~/models/Project', () => ({
-  getProjectByName: jest.fn().mockResolvedValue(null),
-}));
-
-jest.mock('~/server/services/Files/strategies', () => ({
-  getStrategyFunctions: jest.fn(),
-}));
-
-jest.mock('~/server/services/Files/images/avatar', () => ({
-  resizeAvatar: jest.fn(),
-}));
-
-jest.mock('~/server/services/Files/S3/crud', () => ({
-  refreshS3Url: jest.fn(),
-}));
-
-jest.mock('~/server/services/Files/process', () => ({
-  filterFile: jest.fn(),
-}));
-
-jest.mock('~/models/Action', () => ({
-  updateAction: jest.fn(),
-  getActions: jest.fn().mockResolvedValue([]),
-}));
-
-jest.mock('~/models/File', () => ({
-  deleteFileByFilter: jest.fn(),
-}));
-
-jest.mock('~/server/services/PermissionService', () => ({
-  findAccessibleResources: jest.fn().mockResolvedValue([]),
-  findPubliclyAccessibleResources: jest.fn().mockResolvedValue([]),
-  grantPermission: jest.fn(),
-  hasPublicPermission: jest.fn().mockResolvedValue(false),
-  checkPermission: jest.fn().mockResolvedValue(true),
-}));
-
-jest.mock('~/models', () => ({
-  getCategoriesWithCounts: jest.fn(),
-}));
-
-jest.mock('~/cache', () => ({
-  getLogStores: jest.fn(() => ({
-    get: jest.fn(),
-    set: jest.fn(),
-    delete: jest.fn(),
-  })),
-}));
-
-const {
-  filterAuthorizedTools,
-  createAgent: createAgentHandler,
-  updateAgent: updateAgentHandler,
-  duplicateAgent: duplicateAgentHandler,
-  revertAgentVersion: revertAgentVersionHandler,
-} = require('./v1');
-
-const { getMCPServersRegistry } = require('~/config');
-
-let Agent;
-
-describe('MCP Tool Authorization', () => {
-  let mongoServer;
-  let mockReq;
-  let mockRes;
-
-  beforeAll(async () => {
-    mongoServer = await MongoMemoryServer.create();
-    const mongoUri = mongoServer.getUri();
-    await mongoose.connect(mongoUri);
-    Agent = mongoose.models.Agent || mongoose.model('Agent', agentSchema);
-  }, 20000);
-
-  afterAll(async () => {
-    await mongoose.disconnect();
-    await mongoServer.stop();
-  });
-
-  beforeEach(async () => {
-    await Agent.deleteMany({});
-    jest.clearAllMocks();
-
-    getMCPServersRegistry.mockImplementation(() => ({
-      getAllServerConfigs: mockGetAllServerConfigs,
-    }));
-    mockGetAllServerConfigs.mockResolvedValue({
-      authorizedServer: { type: 'sse', url: 'https://authorized.example.com' },
-      anotherServer: { type: 'sse', url: 'https://another.example.com' },
-    });
-
-    mockReq = {
-      user: {
-        id: new mongoose.Types.ObjectId().toString(),
-        role: 'USER',
-      },
-      body: {},
-      params: {},
-      query: {},
-      app: { locals: { fileStrategy: 'local' } },
-    };
-
-    mockRes = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn().mockReturnThis(),
-    };
-  });
-
-  describe('filterAuthorizedTools', () => {
-    const availableTools = { web_search: true, custom_tool: true };
-    const userId = 'test-user-123';
-
-    test('should keep authorized MCP tools and strip unauthorized ones', async () => {
-      const result = await filterAuthorizedTools({
-        tools: [`toolA${d}authorizedServer`, `toolB${d}forbiddenServer`, 'web_search'],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toContain(`toolA${d}authorizedServer`);
-      expect(result).toContain('web_search');
-      expect(result).not.toContain(`toolB${d}forbiddenServer`);
-    });
-
-    test('should keep system tools without querying MCP registry', async () => {
-      const result = await filterAuthorizedTools({
-        tools: ['execute_code', 'file_search', 'web_search'],
-        userId,
-        availableTools: {},
-      });
-
-      expect(result).toEqual(['execute_code', 'file_search', 'web_search']);
-      expect(mockGetAllServerConfigs).not.toHaveBeenCalled();
-    });
-
-    test('should not query MCP registry when no MCP tools are present', async () => {
-      const result = await filterAuthorizedTools({
-        tools: ['web_search', 'custom_tool'],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual(['web_search', 'custom_tool']);
-      expect(mockGetAllServerConfigs).not.toHaveBeenCalled();
-    });
-
-    test('should filter all MCP tools when registry is uninitialized', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      const result = await filterAuthorizedTools({
-        tools: [`toolA${d}someServer`, 'web_search'],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual(['web_search']);
-      expect(result).not.toContain(`toolA${d}someServer`);
-    });
-
-    test('should handle mixed authorized and unauthorized MCP tools', async () => {
-      const result = await filterAuthorizedTools({
-        tools: [
-          'web_search',
-          `search${d}authorizedServer`,
-          `attack${d}victimServer`,
-          'execute_code',
-          `list${d}anotherServer`,
-          `steal${d}nonexistent`,
-        ],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual([
-        'web_search',
-        `search${d}authorizedServer`,
-        'execute_code',
-        `list${d}anotherServer`,
-      ]);
-    });
-
-    test('should handle empty tools array', async () => {
-      const result = await filterAuthorizedTools({
-        tools: [],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual([]);
-      expect(mockGetAllServerConfigs).not.toHaveBeenCalled();
-    });
-
-    test('should handle null/undefined tool entries gracefully', async () => {
-      const result = await filterAuthorizedTools({
-        tools: [null, undefined, '', 'web_search'],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual(['web_search']);
-    });
-
-    test('should call getAllServerConfigs with the correct userId', async () => {
-      await filterAuthorizedTools({
-        tools: [`tool${d}authorizedServer`],
-        userId: 'specific-user-id',
-        availableTools,
-      });
-
-      expect(mockGetAllServerConfigs).toHaveBeenCalledWith('specific-user-id');
-    });
-
-    test('should only call getAllServerConfigs once even with multiple MCP tools', async () => {
-      await filterAuthorizedTools({
-        tools: [`tool1${d}authorizedServer`, `tool2${d}anotherServer`, `tool3${d}unknownServer`],
-        userId,
-        availableTools,
-      });
-
-      expect(mockGetAllServerConfigs).toHaveBeenCalledTimes(1);
-    });
-
-    test('should preserve existing MCP tools when registry is unavailable', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      const existingTools = [`toolA${d}serverA`, `toolB${d}serverB`];
-
-      const result = await filterAuthorizedTools({
-        tools: [...existingTools, `newTool${d}unknownServer`, 'web_search'],
-        userId,
-        availableTools,
-        existingTools,
-      });
-
-      expect(result).toContain(`toolA${d}serverA`);
-      expect(result).toContain(`toolB${d}serverB`);
-      expect(result).toContain('web_search');
-      expect(result).not.toContain(`newTool${d}unknownServer`);
-    });
-
-    test('should still reject all MCP tools when registry is unavailable and no existingTools', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      const result = await filterAuthorizedTools({
-        tools: [`toolA${d}serverA`, 'web_search'],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual(['web_search']);
-    });
-
-    test('should not preserve malformed existing tools when registry is unavailable', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      const malformedTool = `a${d}b${d}c`;
-      const result = await filterAuthorizedTools({
-        tools: [malformedTool, `legit${d}serverA`, 'web_search'],
-        userId,
-        availableTools,
-        existingTools: [malformedTool, `legit${d}serverA`],
-      });
-
-      expect(result).toContain(`legit${d}serverA`);
-      expect(result).toContain('web_search');
-      expect(result).not.toContain(malformedTool);
-    });
-
-    test('should reject malformed MCP tool keys with multiple delimiters', async () => {
-      const result = await filterAuthorizedTools({
-        tools: [
-          `attack${d}victimServer${d}authorizedServer`,
-          `legit${d}authorizedServer`,
-          `a${d}b${d}c${d}d`,
-          'web_search',
-        ],
-        userId,
-        availableTools,
-      });
-
-      expect(result).toEqual([`legit${d}authorizedServer`, 'web_search']);
-      expect(result).not.toContainEqual(expect.stringContaining('victimServer'));
-      expect(result).not.toContainEqual(expect.stringContaining(`a${d}b`));
-    });
-  });
-
-  describe('createAgentHandler - MCP tool authorization', () => {
-    test('should strip unauthorized MCP tools on create', async () => {
-      mockReq.body = {
-        provider: 'openai',
-        model: 'gpt-4',
-        name: 'MCP Test Agent',
-        tools: ['web_search', `validTool${d}authorizedServer`, `attack${d}forbiddenServer`],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-      const agent = mockRes.json.mock.calls[0][0];
-      expect(agent.tools).toContain('web_search');
-      expect(agent.tools).toContain(`validTool${d}authorizedServer`);
-      expect(agent.tools).not.toContain(`attack${d}forbiddenServer`);
-    });
-
-    test('should not 500 when MCP registry is uninitialized', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      mockReq.body = {
-        provider: 'openai',
-        model: 'gpt-4',
-        name: 'MCP Uninitialized Test',
-        tools: [`tool${d}someServer`, 'web_search'],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-      const agent = mockRes.json.mock.calls[0][0];
-      expect(agent.tools).toEqual(['web_search']);
-    });
-
-    test('should store mcpServerNames only for authorized servers', async () => {
-      mockReq.body = {
-        provider: 'openai',
-        model: 'gpt-4',
-        name: 'MCP Names Test',
-        tools: [`toolA${d}authorizedServer`, `toolB${d}forbiddenServer`],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-      const agent = mockRes.json.mock.calls[0][0];
-      const agentInDb = await Agent.findOne({ id: agent.id });
-      expect(agentInDb.mcpServerNames).toContain('authorizedServer');
-      expect(agentInDb.mcpServerNames).not.toContain('forbiddenServer');
-    });
-  });
-
-  describe('updateAgentHandler - MCP tool authorization', () => {
-    let existingAgentId;
-    let existingAgentAuthorId;
-
-    beforeEach(async () => {
-      existingAgentAuthorId = new mongoose.Types.ObjectId();
-      const agent = await Agent.create({
-        id: `agent_${uuidv4()}`,
-        name: 'Original Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: existingAgentAuthorId,
-        tools: ['web_search', `existingTool${d}authorizedServer`],
-        mcpServerNames: ['authorizedServer'],
-        versions: [
-          {
-            name: 'Original Agent',
-            provider: 'openai',
-            model: 'gpt-4',
-            tools: ['web_search', `existingTool${d}authorizedServer`],
-            createdAt: new Date(),
-            updatedAt: new Date(),
-          },
-        ],
-      });
-      existingAgentId = agent.id;
-    });
-
-    test('should preserve existing MCP tools even if editor lacks access', async () => {
-      mockGetAllServerConfigs.mockResolvedValue({});
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        tools: ['web_search', `existingTool${d}authorizedServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const updatedAgent = mockRes.json.mock.calls[0][0];
-      expect(updatedAgent.tools).toContain(`existingTool${d}authorizedServer`);
-      expect(updatedAgent.tools).toContain('web_search');
-    });
-
-    test('should reject newly added unauthorized MCP tools', async () => {
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        tools: ['web_search', `existingTool${d}authorizedServer`, `attack${d}forbiddenServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const updatedAgent = mockRes.json.mock.calls[0][0];
-      expect(updatedAgent.tools).toContain('web_search');
-      expect(updatedAgent.tools).toContain(`existingTool${d}authorizedServer`);
-      expect(updatedAgent.tools).not.toContain(`attack${d}forbiddenServer`);
-    });
-
-    test('should allow adding authorized MCP tools', async () => {
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        tools: ['web_search', `existingTool${d}authorizedServer`, `newTool${d}anotherServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const updatedAgent = mockRes.json.mock.calls[0][0];
-      expect(updatedAgent.tools).toContain(`newTool${d}anotherServer`);
-    });
-
-    test('should not query MCP registry when no new MCP tools added', async () => {
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        tools: ['web_search', `existingTool${d}authorizedServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockGetAllServerConfigs).not.toHaveBeenCalled();
-    });
-
-    test('should preserve existing MCP tools when registry unavailable and user edits agent', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        name: 'Renamed After Restart',
-        tools: ['web_search', `existingTool${d}authorizedServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const updatedAgent = mockRes.json.mock.calls[0][0];
-      expect(updatedAgent.tools).toContain(`existingTool${d}authorizedServer`);
-      expect(updatedAgent.tools).toContain('web_search');
-      expect(updatedAgent.name).toBe('Renamed After Restart');
-    });
-
-    test('should preserve existing MCP tools when server not in configs (disconnected)', async () => {
-      mockGetAllServerConfigs.mockResolvedValue({});
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = {
-        name: 'Edited While Disconnected',
-        tools: ['web_search', `existingTool${d}authorizedServer`],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const updatedAgent = mockRes.json.mock.calls[0][0];
-      expect(updatedAgent.tools).toContain(`existingTool${d}authorizedServer`);
-      expect(updatedAgent.name).toBe('Edited While Disconnected');
-    });
-  });
-
-  describe('duplicateAgentHandler - MCP tool authorization', () => {
-    let sourceAgentId;
-    let sourceAgentAuthorId;
-
-    beforeEach(async () => {
-      sourceAgentAuthorId = new mongoose.Types.ObjectId();
-      const agent = await Agent.create({
-        id: `agent_${uuidv4()}`,
-        name: 'Source Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: sourceAgentAuthorId,
-        tools: ['web_search', `tool${d}authorizedServer`, `tool${d}forbiddenServer`],
-        mcpServerNames: ['authorizedServer', 'forbiddenServer'],
-        versions: [
-          {
-            name: 'Source Agent',
-            provider: 'openai',
-            model: 'gpt-4',
-            tools: ['web_search', `tool${d}authorizedServer`, `tool${d}forbiddenServer`],
-            createdAt: new Date(),
-            updatedAt: new Date(),
-          },
-        ],
-      });
-      sourceAgentId = agent.id;
-    });
-
-    test('should strip unauthorized MCP tools from duplicated agent', async () => {
-      mockGetAllServerConfigs.mockResolvedValue({
-        authorizedServer: { type: 'sse' },
-      });
-
-      mockReq.user.id = sourceAgentAuthorId.toString();
-      mockReq.params.id = sourceAgentId;
-
-      await duplicateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-      const { agent: newAgent } = mockRes.json.mock.calls[0][0];
-      expect(newAgent.id).not.toBe(sourceAgentId);
-      expect(newAgent.tools).toContain('web_search');
-      expect(newAgent.tools).toContain(`tool${d}authorizedServer`);
-      expect(newAgent.tools).not.toContain(`tool${d}forbiddenServer`);
-
-      const agentInDb = await Agent.findOne({ id: newAgent.id });
-      expect(agentInDb.mcpServerNames).toContain('authorizedServer');
-      expect(agentInDb.mcpServerNames).not.toContain('forbiddenServer');
-    });
-
-    test('should preserve source agent MCP tools when registry is unavailable', async () => {
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      mockReq.user.id = sourceAgentAuthorId.toString();
-      mockReq.params.id = sourceAgentId;
-
-      await duplicateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-      const { agent: newAgent } = mockRes.json.mock.calls[0][0];
-      expect(newAgent.tools).toContain('web_search');
-      expect(newAgent.tools).toContain(`tool${d}authorizedServer`);
-      expect(newAgent.tools).toContain(`tool${d}forbiddenServer`);
-    });
-  });
-
-  describe('revertAgentVersionHandler - MCP tool authorization', () => {
-    let existingAgentId;
-    let existingAgentAuthorId;
-
-    beforeEach(async () => {
-      existingAgentAuthorId = new mongoose.Types.ObjectId();
-      const agent = await Agent.create({
-        id: `agent_${uuidv4()}`,
-        name: 'Reverted Agent V2',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: existingAgentAuthorId,
-        tools: ['web_search'],
-        versions: [
-          {
-            name: 'Reverted Agent V1',
-            provider: 'openai',
-            model: 'gpt-4',
-            tools: ['web_search', `oldTool${d}revokedServer`],
-            createdAt: new Date(Date.now() - 10000),
-            updatedAt: new Date(Date.now() - 10000),
-          },
-          {
-            name: 'Reverted Agent V2',
-            provider: 'openai',
-            model: 'gpt-4',
-            tools: ['web_search'],
-            createdAt: new Date(),
-            updatedAt: new Date(),
-          },
-        ],
-      });
-      existingAgentId = agent.id;
-    });
-
-    test('should strip unauthorized MCP tools after reverting to a previous version', async () => {
-      mockGetAllServerConfigs.mockResolvedValue({
-        authorizedServer: { type: 'sse' },
-      });
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = { version_index: 0 };
-
-      await revertAgentVersionHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const result = mockRes.json.mock.calls[0][0];
-      expect(result.tools).toContain('web_search');
-      expect(result.tools).not.toContain(`oldTool${d}revokedServer`);
-
-      const agentInDb = await Agent.findOne({ id: existingAgentId });
-      expect(agentInDb.tools).toContain('web_search');
-      expect(agentInDb.tools).not.toContain(`oldTool${d}revokedServer`);
-    });
-
-    test('should keep authorized MCP tools after revert', async () => {
-      await Agent.updateOne(
-        { id: existingAgentId },
-        { $set: { 'versions.0.tools': ['web_search', `tool${d}authorizedServer`] } },
-      );
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = { version_index: 0 };
-
-      await revertAgentVersionHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const result = mockRes.json.mock.calls[0][0];
-      expect(result.tools).toContain('web_search');
-      expect(result.tools).toContain(`tool${d}authorizedServer`);
-    });
-
-    test('should preserve version MCP tools when registry is unavailable on revert', async () => {
-      await Agent.updateOne(
-        { id: existingAgentId },
-        {
-          $set: {
-            'versions.0.tools': [
-              'web_search',
-              `validTool${d}authorizedServer`,
-              `otherTool${d}anotherServer`,
-            ],
-          },
-        },
-      );
-
-      getMCPServersRegistry.mockImplementation(() => {
-        throw new Error('MCPServersRegistry has not been initialized.');
-      });
-
-      mockReq.user.id = existingAgentAuthorId.toString();
-      mockReq.params.id = existingAgentId;
-      mockReq.body = { version_index: 0 };
-
-      await revertAgentVersionHandler(mockReq, mockRes);
-
-      expect(mockRes.json).toHaveBeenCalled();
-      const result = mockRes.json.mock.calls[0][0];
-      expect(result.tools).toContain('web_search');
-      expect(result.tools).toContain(`validTool${d}authorizedServer`);
-      expect(result.tools).toContain(`otherTool${d}anotherServer`);
-
-      const agentInDb = await Agent.findOne({ id: existingAgentId });
-      expect(agentInDb.tools).toContain(`validTool${d}authorizedServer`);
-      expect(agentInDb.tools).toContain(`otherTool${d}anotherServer`);
-    });
-  });
-});
--- a/api/server/controllers/agents/openai.js
+++ b/api/server/controllers/agents/openai.js
@ -1,714 +0,0 @@
-const { nanoid } = require('nanoid');
-const { logger } = require('@librechat/data-schemas');
-const { Callback, ToolEndHandler, formatAgentMessages } = require('@librechat/agents');
-const { EModelEndpoint, ResourceType, PermissionBits } = require('librechat-data-provider');
-const {
-  writeSSE,
-  createRun,
-  createChunk,
-  buildToolSet,
-  sendFinalChunk,
-  createSafeUser,
-  validateRequest,
-  initializeAgent,
-  getBalanceConfig,
-  createErrorResponse,
-  recordCollectedUsage,
-  getTransactionsConfig,
-  createToolExecuteHandler,
-  buildNonStreamingResponse,
-  createOpenAIStreamTracker,
-  createOpenAIContentAggregator,
-  isChatCompletionValidationFailure,
-} = require('@librechat/api');
-const { loadAgentTools, loadToolsForExecution } = require('~/server/services/ToolService');
-const { createToolEndCallback } = require('~/server/controllers/agents/callbacks');
-const { findAccessibleResources } = require('~/server/services/PermissionService');
-const { spendTokens, spendStructuredTokens } = require('~/models/spendTokens');
-const { getMultiplier, getCacheMultiplier } = require('~/models/tx');
-const { getConvoFiles } = require('~/models/Conversation');
-const { getAgent, getAgents } = require('~/models/Agent');
-const db = require('~/models');
-
-/**
- * Creates a tool loader function for the agent.
- * @param {AbortSignal} signal - The abort signal
- * @param {boolean} [definitionsOnly=true] - When true, returns only serializable
- *   tool definitions without creating full tool instances (for event-driven mode)
- */
-function createToolLoader(signal, definitionsOnly = true) {
-  return async function loadTools({
-    req,
-    res,
-    tools,
-    model,
-    agentId,
-    provider,
-    tool_options,
-    tool_resources,
-  }) {
-    const agent = { id: agentId, tools, provider, model, tool_options };
-    try {
-      return await loadAgentTools({
-        req,
-        res,
-        agent,
-        signal,
-        tool_resources,
-        definitionsOnly,
-        streamId: null, // No resumable stream for OpenAI compat
-      });
-    } catch (error) {
-      logger.error('Error loading tools for agent ' + agentId, error);
-    }
-  };
-}
-
-/**
- * Convert content part to internal format
- * @param {Object} part - Content part
- * @returns {Object} Converted part
- */
-function convertContentPart(part) {
-  if (part.type === 'text') {
-    return { type: 'text', text: part.text };
-  }
-  if (part.type === 'image_url') {
-    return { type: 'image_url', image_url: part.image_url };
-  }
-  return part;
-}
-
-/**
- * Convert OpenAI messages to internal format
- * @param {Array} messages - OpenAI format messages
- * @returns {Array} Internal format messages
- */
-function convertMessages(messages) {
-  return messages.map((msg) => {
-    let content;
-    if (typeof msg.content === 'string') {
-      content = msg.content;
-    } else if (msg.content) {
-      content = msg.content.map(convertContentPart);
-    } else {
-      content = '';
-    }
-
-    return {
-      role: msg.role,
-      content,
-      ...(msg.name && { name: msg.name }),
-      ...(msg.tool_calls && { tool_calls: msg.tool_calls }),
-      ...(msg.tool_call_id && { tool_call_id: msg.tool_call_id }),
-    };
-  });
-}
-
-/**
- * Send an error response in OpenAI format
- */
-function sendErrorResponse(res, statusCode, message, type = 'invalid_request_error', code = null) {
-  res.status(statusCode).json(createErrorResponse(message, type, code));
-}
-
-/**
- * OpenAI-compatible chat completions controller for agents.
- *
- * POST /v1/chat/completions
- *
- * Request format:
- * {
- *   "model": "agent_id_here",
- *   "messages": [{"role": "user", "content": "Hello!"}],
- *   "stream": true,
- *   "conversation_id": "optional",
- *   "parent_message_id": "optional"
- * }
- */
-const OpenAIChatCompletionController = async (req, res) => {
-  const appConfig = req.config;
-  const requestStartTime = Date.now();
-
-  const validation = validateRequest(req.body);
-  if (isChatCompletionValidationFailure(validation)) {
-    return sendErrorResponse(res, 400, validation.error);
-  }
-
-  const request = validation.request;
-  const agentId = request.model;
-
-  // Look up the agent
-  const agent = await getAgent({ id: agentId });
-  if (!agent) {
-    return sendErrorResponse(
-      res,
-      404,
-      `Agent not found: ${agentId}`,
-      'invalid_request_error',
-      'model_not_found',
-    );
-  }
-
-  const responseId = `chatcmpl-${nanoid()}`;
-  const conversationId = request.conversation_id ?? nanoid();
-  const parentMessageId = request.parent_message_id ?? null;
-  const created = Math.floor(Date.now() / 1000);
-
-  /** @type {import('@librechat/api').OpenAIResponseContext} — key must be `requestId` to match the type used by createChunk/buildNonStreamingResponse */
-  const context = {
-    created,
-    requestId: responseId,
-    model: agentId,
-  };
-
-  logger.debug(
-    `[OpenAI API] Response ${responseId} started for agent ${agentId}, stream: ${request.stream}`,
-  );
-
-  // Set up abort controller
-  const abortController = new AbortController();
-
-  // Handle client disconnect
-  req.on('close', () => {
-    if (!abortController.signal.aborted) {
-      abortController.abort();
-      logger.debug('[OpenAI API] Client disconnected, aborting');
-    }
-  });
-
-  try {
-    // Build allowed providers set
-    const allowedProviders = new Set(
-      appConfig?.endpoints?.[EModelEndpoint.agents]?.allowedProviders,
-    );
-
-    // Create tool loader
-    const loadTools = createToolLoader(abortController.signal);
-
-    // Initialize the agent first to check for disableStreaming
-    const endpointOption = {
-      endpoint: agent.provider,
-      model_parameters: agent.model_parameters ?? {},
-    };
-
-    const primaryConfig = await initializeAgent(
-      {
-        req,
-        res,
-        loadTools,
-        requestFiles: [],
-        conversationId,
-        parentMessageId,
-        agent,
-        endpointOption,
-        allowedProviders,
-        isInitialAgent: true,
-      },
-      {
-        getConvoFiles,
-        getFiles: db.getFiles,
-        getUserKey: db.getUserKey,
-        getMessages: db.getMessages,
-        updateFilesUsage: db.updateFilesUsage,
-        getUserKeyValues: db.getUserKeyValues,
-        getUserCodeFiles: db.getUserCodeFiles,
-        getToolFilesByIds: db.getToolFilesByIds,
-        getCodeGeneratedFiles: db.getCodeGeneratedFiles,
-      },
-    );
-
-    // Determine if streaming is enabled (check both request and agent config)
-    const streamingDisabled = !!primaryConfig.model_parameters?.disableStreaming;
-    const isStreaming = request.stream === true && !streamingDisabled;
-
-    // Create tracker for streaming or aggregator for non-streaming
-    const tracker = isStreaming ? createOpenAIStreamTracker() : null;
-    const aggregator = isStreaming ? null : createOpenAIContentAggregator();
-
-    // Set up response for streaming
-    if (isStreaming) {
-      res.setHeader('Content-Type', 'text/event-stream');
-      res.setHeader('Cache-Control', 'no-cache');
-      res.setHeader('Connection', 'keep-alive');
-      res.setHeader('X-Accel-Buffering', 'no');
-      res.flushHeaders();
-
-      // Send initial chunk with role
-      const initialChunk = createChunk(context, { role: 'assistant' });
-      writeSSE(res, initialChunk);
-    }
-
-    // Create handler config for OpenAI streaming (only used when streaming)
-    const handlerConfig = isStreaming
-      ? {
-          res,
-          context,
-          tracker,
-        }
-      : null;
-
-    const collectedUsage = [];
-    /** @type {Promise<import('librechat-data-provider').TAttachment | null>[]} */
-    const artifactPromises = [];
-
-    const toolEndCallback = createToolEndCallback({ req, res, artifactPromises, streamId: null });
-
-    const toolExecuteOptions = {
-      loadTools: async (toolNames) => {
-        return loadToolsForExecution({
-          req,
-          res,
-          agent,
-          toolNames,
-          signal: abortController.signal,
-          toolRegistry: primaryConfig.toolRegistry,
-          userMCPAuthMap: primaryConfig.userMCPAuthMap,
-          tool_resources: primaryConfig.tool_resources,
-          actionsEnabled: primaryConfig.actionsEnabled,
-        });
-      },
-      toolEndCallback,
-    };
-
-    const openaiMessages = convertMessages(request.messages);
-
-    const toolSet = buildToolSet(primaryConfig);
-    const { messages: formattedMessages, indexTokenCountMap } = formatAgentMessages(
-      openaiMessages,
-      {},
-      toolSet,
-    );
-
-    /**
-     * Create a simple handler that processes data
-     */
-    const createHandler = (processor) => ({
-      handle: (_event, data) => {
-        if (processor) {
-          processor(data);
-        }
-      },
-    });
-
-    /**
-     * Stream text content in OpenAI format
-     */
-    const streamText = (text) => {
-      if (!text) {
-        return;
-      }
-      if (isStreaming) {
-        tracker.addText();
-        writeSSE(res, createChunk(context, { content: text }));
-      } else {
-        aggregator.addText(text);
-      }
-    };
-
-    /**
-     * Stream reasoning content in OpenAI format (OpenRouter convention)
-     */
-    const streamReasoning = (text) => {
-      if (!text) {
-        return;
-      }
-      if (isStreaming) {
-        tracker.addReasoning();
-        writeSSE(res, createChunk(context, { reasoning: text }));
-      } else {
-        aggregator.addReasoning(text);
-      }
-    };
-
-    // Event handlers for OpenAI-compatible streaming
-    const handlers = {
-      // Text content streaming
-      on_message_delta: createHandler((data) => {
-        const content = data?.delta?.content;
-        if (Array.isArray(content)) {
-          for (const part of content) {
-            if (part.type === 'text' && part.text) {
-              streamText(part.text);
-            }
-          }
-        }
-      }),
-
-      // Reasoning/thinking content streaming
-      on_reasoning_delta: createHandler((data) => {
-        const content = data?.delta?.content;
-        if (Array.isArray(content)) {
-          for (const part of content) {
-            const text = part.think || part.text;
-            if (text) {
-              streamReasoning(text);
-            }
-          }
-        }
-      }),
-
-      // Tool call initiation - streams id and name (from on_run_step)
-      on_run_step: createHandler((data) => {
-        const stepDetails = data?.stepDetails;
-        if (stepDetails?.type === 'tool_calls' && stepDetails.tool_calls) {
-          for (const tc of stepDetails.tool_calls) {
-            const toolIndex = data.index ?? 0;
-            const toolId = tc.id ?? '';
-            const toolName = tc.name ?? '';
-            const toolCall = {
-              id: toolId,
-              type: 'function',
-              function: { name: toolName, arguments: '' },
-            };
-
-            // Track tool call in tracker or aggregator
-            if (isStreaming) {
-              if (!tracker.toolCalls.has(toolIndex)) {
-                tracker.toolCalls.set(toolIndex, toolCall);
-              }
-              // Stream initial tool call chunk (like OpenAI does)
-              writeSSE(
-                res,
-                createChunk(context, {
-                  tool_calls: [{ index: toolIndex, ...toolCall }],
-                }),
-              );
-            } else {
-              if (!aggregator.toolCalls.has(toolIndex)) {
-                aggregator.toolCalls.set(toolIndex, toolCall);
-              }
-            }
-          }
-        }
-      }),
-
-      // Tool call argument streaming (from on_run_step_delta)
-      on_run_step_delta: createHandler((data) => {
-        const delta = data?.delta;
-        if (delta?.type === 'tool_calls' && delta.tool_calls) {
-          for (const tc of delta.tool_calls) {
-            const args = tc.args ?? '';
-            if (!args) {
-              continue;
-            }
-
-            const toolIndex = tc.index ?? 0;
-
-            // Update tool call arguments
-            const targetMap = isStreaming ? tracker.toolCalls : aggregator.toolCalls;
-            const tracked = targetMap.get(toolIndex);
-            if (tracked) {
-              tracked.function.arguments += args;
-            }
-
-            // Stream argument delta (only for streaming)
-            if (isStreaming) {
-              writeSSE(
-                res,
-                createChunk(context, {
-                  tool_calls: [
-                    {
-                      index: toolIndex,
-                      function: { arguments: args },
-                    },
-                  ],
-                }),
-              );
-            }
-          }
-        }
-      }),
-
-      // Usage tracking
-      on_chat_model_end: createHandler((data) => {
-        const usage = data?.output?.usage_metadata;
-        if (usage) {
-          collectedUsage.push(usage);
-          const target = isStreaming ? tracker : aggregator;
-          target.usage.promptTokens += usage.input_tokens ?? 0;
-          target.usage.completionTokens += usage.output_tokens ?? 0;
-        }
-      }),
-      on_run_step_completed: createHandler(),
-      // Use proper ToolEndHandler for processing artifacts (images, file citations, code output)
-      on_tool_end: new ToolEndHandler(toolEndCallback, logger),
-      on_chain_stream: createHandler(),
-      on_chain_end: createHandler(),
-      on_agent_update: createHandler(),
-      on_custom_event: createHandler(),
-      // Event-driven tool execution handler
-      on_tool_execute: createToolExecuteHandler(toolExecuteOptions),
-    };
-
-    // Create and run the agent
-    const userId = req.user?.id ?? 'api-user';
-
-    // Extract userMCPAuthMap from primaryConfig (needed for MCP tool connections)
-    const userMCPAuthMap = primaryConfig.userMCPAuthMap;
-
-    const run = await createRun({
-      agents: [primaryConfig],
-      messages: formattedMessages,
-      indexTokenCountMap,
-      runId: responseId,
-      signal: abortController.signal,
-      customHandlers: handlers,
-      requestBody: {
-        messageId: responseId,
-        conversationId,
-      },
-      user: { id: userId },
-    });
-
-    if (!run) {
-      throw new Error('Failed to create agent run');
-    }
-
-    // Process the stream
-    const config = {
-      runName: 'AgentRun',
-      configurable: {
-        thread_id: conversationId,
-        user_id: userId,
-        user: createSafeUser(req.user),
-        requestBody: {
-          messageId: responseId,
-          conversationId,
-        },
-        ...(userMCPAuthMap != null && { userMCPAuthMap }),
-      },
-      signal: abortController.signal,
-      streamMode: 'values',
-      version: 'v2',
-    };
-
-    await run.processStream({ messages: formattedMessages }, config, {
-      callbacks: {
-        [Callback.TOOL_ERROR]: (graph, error, toolId) => {
-          logger.error(`[OpenAI API] Tool Error "${toolId}"`, error);
-        },
-      },
-    });
-
-    // Record token usage against balance
-    const balanceConfig = getBalanceConfig(appConfig);
-    const transactionsConfig = getTransactionsConfig(appConfig);
-    recordCollectedUsage(
-      {
-        spendTokens,
-        spendStructuredTokens,
-        pricing: { getMultiplier, getCacheMultiplier },
-        bulkWriteOps: { insertMany: db.bulkInsertTransactions, updateBalance: db.updateBalance },
-      },
-      {
-        user: userId,
-        conversationId,
-        collectedUsage,
-        context: 'message',
-        messageId: responseId,
-        balance: balanceConfig,
-        transactions: transactionsConfig,
-        model: primaryConfig.model || agent.model_parameters?.model,
-      },
-    ).catch((err) => {
-      logger.error('[OpenAI API] Error recording usage:', err);
-    });
-
-    // Finalize response
-    const duration = Date.now() - requestStartTime;
-    if (isStreaming) {
-      sendFinalChunk(handlerConfig);
-      res.end();
-      logger.debug(`[OpenAI API] Response ${responseId} completed in ${duration}ms (streaming)`);
-
-      // Wait for artifact processing after response ends (non-blocking)
-      if (artifactPromises.length > 0) {
-        Promise.all(artifactPromises).catch((artifactError) => {
-          logger.warn('[OpenAI API] Error processing artifacts:', artifactError);
-        });
-      }
-    } else {
-      // For non-streaming, wait for artifacts before sending response
-      if (artifactPromises.length > 0) {
-        try {
-          await Promise.all(artifactPromises);
-        } catch (artifactError) {
-          logger.warn('[OpenAI API] Error processing artifacts:', artifactError);
-        }
-      }
-
-      // Build usage from aggregated data
-      const usage = {
-        prompt_tokens: aggregator.usage.promptTokens,
-        completion_tokens: aggregator.usage.completionTokens,
-        total_tokens: aggregator.usage.promptTokens + aggregator.usage.completionTokens,
-      };
-
-      if (aggregator.usage.reasoningTokens > 0) {
-        usage.completion_tokens_details = {
-          reasoning_tokens: aggregator.usage.reasoningTokens,
-        };
-      }
-
-      const response = buildNonStreamingResponse(
-        context,
-        aggregator.getText(),
-        aggregator.getReasoning(),
-        aggregator.toolCalls,
-        usage,
-      );
-      res.json(response);
-      logger.debug(
-        `[OpenAI API] Response ${responseId} completed in ${duration}ms (non-streaming)`,
-      );
-    }
-  } catch (error) {
-    const errorMessage = error instanceof Error ? error.message : 'An error occurred';
-    logger.error('[OpenAI API] Error:', error);
-
-    // Check if we already started streaming (headers sent)
-    if (res.headersSent) {
-      // Headers already sent, send error in stream
-      const errorChunk = createChunk(context, { content: `\n\nError: ${errorMessage}` }, 'stop');
-      writeSSE(res, errorChunk);
-      writeSSE(res, '[DONE]');
-      res.end();
-    } else {
-      // Forward upstream provider status codes (e.g., Anthropic 400s) instead of masking as 500
-      const statusCode =
-        typeof error?.status === 'number' && error.status >= 400 && error.status < 600
-          ? error.status
-          : 500;
-      const errorType =
-        statusCode >= 400 && statusCode < 500 ? 'invalid_request_error' : 'server_error';
-      sendErrorResponse(res, statusCode, errorMessage, errorType);
-    }
-  }
-};
-
-/**
- * List available agents as models (filtered by remote access permissions)
- *
- * GET /v1/models
- */
-const ListModelsController = async (req, res) => {
-  try {
-    const userId = req.user?.id;
-    const userRole = req.user?.role;
-
-    if (!userId) {
-      return sendErrorResponse(res, 401, 'Authentication required', 'auth_error');
-    }
-
-    // Find agents the user has remote access to (VIEW permission on REMOTE_AGENT)
-    const accessibleAgentIds = await findAccessibleResources({
-      userId,
-      role: userRole,
-      resourceType: ResourceType.REMOTE_AGENT,
-      requiredPermissions: PermissionBits.VIEW,
-    });
-
-    // Get the accessible agents
-    let agents = [];
-    if (accessibleAgentIds.length > 0) {
-      agents = await getAgents({ _id: { $in: accessibleAgentIds } });
-    }
-
-    const models = agents.map((agent) => ({
-      id: agent.id,
-      object: 'model',
-      created: Math.floor(new Date(agent.createdAt || Date.now()).getTime() / 1000),
-      owned_by: 'librechat',
-      permission: [],
-      root: agent.id,
-      parent: null,
-      // LibreChat extensions
-      name: agent.name,
-      description: agent.description,
-      provider: agent.provider,
-    }));
-
-    res.json({
-      object: 'list',
-      data: models,
-    });
-  } catch (error) {
-    const errorMessage = error instanceof Error ? error.message : 'Failed to list models';
-    logger.error('[OpenAI API] Error listing models:', error);
-    sendErrorResponse(res, 500, errorMessage, 'server_error');
-  }
-};
-
-/**
- * Get a specific model/agent (with remote access permission check)
- *
- * GET /v1/models/:model
- */
-const GetModelController = async (req, res) => {
-  try {
-    const { model } = req.params;
-    const userId = req.user?.id;
-    const userRole = req.user?.role;
-
-    if (!userId) {
-      return sendErrorResponse(res, 401, 'Authentication required', 'auth_error');
-    }
-
-    const agent = await getAgent({ id: model });
-
-    if (!agent) {
-      return sendErrorResponse(
-        res,
-        404,
-        `Model not found: ${model}`,
-        'invalid_request_error',
-        'model_not_found',
-      );
-    }
-
-    // Check if user has remote access to this agent
-    const accessibleAgentIds = await findAccessibleResources({
-      userId,
-      role: userRole,
-      resourceType: ResourceType.REMOTE_AGENT,
-      requiredPermissions: PermissionBits.VIEW,
-    });
-
-    const hasAccess = accessibleAgentIds.some((id) => id.toString() === agent._id.toString());
-
-    if (!hasAccess) {
-      return sendErrorResponse(
-        res,
-        403,
-        `No remote access to model: ${model}`,
-        'permission_error',
-        'access_denied',
-      );
-    }
-
-    res.json({
-      id: agent.id,
-      object: 'model',
-      created: Math.floor(new Date(agent.createdAt || Date.now()).getTime() / 1000),
-      owned_by: 'librechat',
-      permission: [],
-      root: agent.id,
-      parent: null,
-      // LibreChat extensions
-      name: agent.name,
-      description: agent.description,
-      provider: agent.provider,
-    });
-  } catch (error) {
-    const errorMessage = error instanceof Error ? error.message : 'Failed to get model';
-    logger.error('[OpenAI API] Error getting model:', error);
-    sendErrorResponse(res, 500, errorMessage, 'server_error');
-  }
-};
-
-module.exports = {
-  OpenAIChatCompletionController,
-  ListModelsController,
-  GetModelController,
-};
--- a/api/server/controllers/agents/recordCollectedUsage.spec.js
+++ b/api/server/controllers/agents/recordCollectedUsage.spec.js
@ -2,37 +2,23 @@
 * Tests for AgentClient.recordCollectedUsage
 *
 * This is a critical function that handles token spending for agent LLM calls.
- * The client now delegates to the TS recordCollectedUsage from @librechat/api,
- * passing pricing and bulkWriteOps deps.
+ * It must correctly handle:
+ * - Sequential execution (single agent with tool calls)
+ * - Parallel execution (multiple agents with independent inputs)
+ * - Cache token handling (OpenAI and Anthropic formats)
 */

 const { EModelEndpoint } = require('librechat-data-provider');

+// Mock dependencies before requiring the module
 const mockSpendTokens = jest.fn().mockResolvedValue();
 const mockSpendStructuredTokens = jest.fn().mockResolvedValue();
-const mockGetMultiplier = jest.fn().mockReturnValue(1);
-const mockGetCacheMultiplier = jest.fn().mockReturnValue(null);
-const mockUpdateBalance = jest.fn().mockResolvedValue({});
-const mockBulkInsertTransactions = jest.fn().mockResolvedValue(undefined);
-const mockRecordCollectedUsage = jest
-  .fn()
-  .mockResolvedValue({ input_tokens: 100, output_tokens: 50 });

 jest.mock('~/models/spendTokens', () => ({
  spendTokens: (...args) => mockSpendTokens(...args),
  spendStructuredTokens: (...args) => mockSpendStructuredTokens(...args),
 }));

-jest.mock('~/models/tx', () => ({
-  getMultiplier: mockGetMultiplier,
-  getCacheMultiplier: mockGetCacheMultiplier,
-}));
-
-jest.mock('~/models', () => ({
-  updateBalance: mockUpdateBalance,
-  bulkInsertTransactions: mockBulkInsertTransactions,
-}));
-
 jest.mock('~/config', () => ({
  logger: {
    debug: jest.fn(),
@ -53,14 +39,6 @@ jest.mock('@librechat/agents', () => ({
  }),
 }));

-jest.mock('@librechat/api', () => {
-  const actual = jest.requireActual('@librechat/api');
-  return {
-    ...actual,
-    recordCollectedUsage: (...args) => mockRecordCollectedUsage(...args),
-  };
-});
-
 const AgentClient = require('./client');

 describe('AgentClient - recordCollectedUsage', () => {
@ -96,7 +74,30 @@ describe('AgentClient - recordCollectedUsage', () => {
  });

  describe('basic functionality', () => {
-    it('should delegate to recordCollectedUsage with full deps', async () => {
+    it('should return early if collectedUsage is empty', async () => {
+      await client.recordCollectedUsage({
+        collectedUsage: [],
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(mockSpendStructuredTokens).not.toHaveBeenCalled();
+      expect(client.usage).toBeUndefined();
+    });
+
+    it('should return early if collectedUsage is null', async () => {
+      await client.recordCollectedUsage({
+        collectedUsage: null,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(client.usage).toBeUndefined();
+    });
+
+    it('should handle single usage entry correctly', async () => {
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50, model: 'gpt-4' }];

      await client.recordCollectedUsage({
@ -105,57 +106,25 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      const [deps, params] = mockRecordCollectedUsage.mock.calls[0];
-
-      expect(deps).toHaveProperty('spendTokens');
-      expect(deps).toHaveProperty('spendStructuredTokens');
-      expect(deps).toHaveProperty('pricing');
-      expect(deps.pricing).toHaveProperty('getMultiplier');
-      expect(deps.pricing).toHaveProperty('getCacheMultiplier');
-      expect(deps).toHaveProperty('bulkWriteOps');
-      expect(deps.bulkWriteOps).toHaveProperty('insertMany');
-      expect(deps.bulkWriteOps).toHaveProperty('updateBalance');
-
-      expect(params).toEqual(
+      expect(mockSpendTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).toHaveBeenCalledWith(
        expect.objectContaining({
-          user: 'user-123',
          conversationId: 'convo-123',
-          collectedUsage,
-          context: 'message',
-          balance: { enabled: true },
-          transactions: { enabled: true },
+          user: 'user-123',
+          model: 'gpt-4',
        }),
+        { promptTokens: 100, completionTokens: 50 },
      );
+      expect(client.usage.input_tokens).toBe(100);
+      expect(client.usage.output_tokens).toBe(50);
    });

-    it('should not set this.usage if collectedUsage is empty (returns undefined)', async () => {
-      mockRecordCollectedUsage.mockResolvedValue(undefined);
-
-      await client.recordCollectedUsage({
-        collectedUsage: [],
-        balance: { enabled: true },
-        transactions: { enabled: true },
-      });
-
-      expect(client.usage).toBeUndefined();
-    });
-
-    it('should not set this.usage if collectedUsage is null (returns undefined)', async () => {
-      mockRecordCollectedUsage.mockResolvedValue(undefined);
-
-      await client.recordCollectedUsage({
-        collectedUsage: null,
-        balance: { enabled: true },
-        transactions: { enabled: true },
-      });
-
-      expect(client.usage).toBeUndefined();
-    });
-
-    it('should set this.usage from recordCollectedUsage result', async () => {
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 200, output_tokens: 75 });
-      const collectedUsage = [{ input_tokens: 200, output_tokens: 75, model: 'gpt-4' }];
+    it('should skip null entries in collectedUsage', async () => {
+      const collectedUsage = [
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        null,
+        { input_tokens: 200, output_tokens: 60, model: 'gpt-4' },
+      ];

      await client.recordCollectedUsage({
        collectedUsage,
@ -163,62 +132,82 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

-      expect(client.usage).toEqual({ input_tokens: 200, output_tokens: 75 });
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
    });
  });

  describe('sequential execution (single agent with tool calls)', () => {
-    it('should pass all usage entries to recordCollectedUsage', async () => {
+    it('should calculate tokens correctly for sequential tool calls', async () => {
+      // Sequential flow: output of call N becomes part of input for call N+1
+      // Call 1: input=100, output=50
+      // Call 2: input=150 (100+50), output=30
+      // Call 3: input=180 (150+30), output=20
      const collectedUsage = [
        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
        { input_tokens: 150, output_tokens: 30, model: 'gpt-4' },
        { input_tokens: 180, output_tokens: 20, model: 'gpt-4' },
      ];

-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 100 });
-
      await client.recordCollectedUsage({
        collectedUsage,
        balance: { enabled: true },
        transactions: { enabled: true },
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      const [, params] = mockRecordCollectedUsage.mock.calls[0];
-      expect(params.collectedUsage).toHaveLength(3);
+      expect(mockSpendTokens).toHaveBeenCalledTimes(3);
+      // Total output should be sum of all output_tokens: 50 + 30 + 20 = 100
      expect(client.usage.output_tokens).toBe(100);
-      expect(client.usage.input_tokens).toBe(100);
+      expect(client.usage.input_tokens).toBe(100); // First entry's input
    });
  });

  describe('parallel execution (multiple agents)', () => {
-    it('should pass parallel agent usage to recordCollectedUsage', async () => {
+    it('should handle parallel agents with independent input tokens', async () => {
+      // Parallel agents have INDEPENDENT input tokens (not cumulative)
+      // Agent A: input=100, output=50
+      // Agent B: input=80, output=40 (different context, not 100+50)
      const collectedUsage = [
        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
        { input_tokens: 80, output_tokens: 40, model: 'gpt-4' },
      ];

-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 90 });
-
      await client.recordCollectedUsage({
        collectedUsage,
        balance: { enabled: true },
        transactions: { enabled: true },
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(client.usage.output_tokens).toBe(90);
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+      // Expected total output: 50 + 40 = 90
+      // output_tokens must be positive and should reflect total output
      expect(client.usage.output_tokens).toBeGreaterThan(0);
    });

-    /** Bug regression: parallel agents where second agent has LOWER input tokens produced negative output via incremental calculation. */
-    it('should NOT produce negative output_tokens', async () => {
+    it('should NOT produce negative output_tokens for parallel execution', async () => {
+      // Critical bug scenario: parallel agents where second agent has LOWER input tokens
      const collectedUsage = [
        { input_tokens: 200, output_tokens: 100, model: 'gpt-4' },
        { input_tokens: 50, output_tokens: 30, model: 'gpt-4' },
      ];

-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 200, output_tokens: 130 });
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      // output_tokens MUST be positive for proper token tracking
+      expect(client.usage.output_tokens).toBeGreaterThan(0);
+      // Correct value should be 100 + 30 = 130
+    });
+
+    it('should calculate correct total output for parallel agents', async () => {
+      // Three parallel agents with independent contexts
+      const collectedUsage = [
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        { input_tokens: 120, output_tokens: 60, model: 'gpt-4-turbo' },
+        { input_tokens: 80, output_tokens: 40, model: 'claude-3' },
+      ];

      await client.recordCollectedUsage({
        collectedUsage,
@ -226,44 +215,111 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

+      expect(mockSpendTokens).toHaveBeenCalledTimes(3);
+      // Total output should be 50 + 60 + 40 = 150
+      expect(client.usage.output_tokens).toBe(150);
+    });
+
+    it('should handle worst-case parallel scenario without negative tokens', async () => {
+      // Extreme case: first agent has very high input, subsequent have low
+      const collectedUsage = [
+        { input_tokens: 1000, output_tokens: 500, model: 'gpt-4' },
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        { input_tokens: 50, output_tokens: 25, model: 'gpt-4' },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      // Must be positive, should be 500 + 50 + 25 = 575
      expect(client.usage.output_tokens).toBeGreaterThan(0);
-      expect(client.usage.output_tokens).toBe(130);
+      expect(client.usage.output_tokens).toBe(575);
    });
  });

  describe('real-world scenarios', () => {
-    it('should correctly handle sequential tool calls with growing context', async () => {
-      const collectedUsage = [
-        { input_tokens: 31596, output_tokens: 151, model: 'claude-opus-4-5-20251101' },
-        { input_tokens: 35368, output_tokens: 150, model: 'claude-opus-4-5-20251101' },
-        { input_tokens: 58362, output_tokens: 295, model: 'claude-opus-4-5-20251101' },
-        { input_tokens: 112604, output_tokens: 193, model: 'claude-opus-4-5-20251101' },
-        { input_tokens: 257440, output_tokens: 2217, model: 'claude-opus-4-5-20251101' },
-      ];
-
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 31596, output_tokens: 3006 });
-
-      await client.recordCollectedUsage({
-        collectedUsage,
-        balance: { enabled: true },
-        transactions: { enabled: true },
-      });
-
-      expect(client.usage.input_tokens).toBe(31596);
-      expect(client.usage.output_tokens).toBe(3006);
-    });
-
-    it('should correctly handle cache tokens', async () => {
+    it('should correctly sum output tokens for sequential tool calls with growing context', async () => {
+      // Real production data: Claude Opus with multiple tool calls
+      // Context grows as tool results are added, but output_tokens should only count model generations
      const collectedUsage = [
        {
-          input_tokens: 788,
-          output_tokens: 163,
-          input_token_details: { cache_read: 0, cache_creation: 30808 },
+          input_tokens: 31596,
+          output_tokens: 151,
+          total_tokens: 31747,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 35368,
+          output_tokens: 150,
+          total_tokens: 35518,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 58362,
+          output_tokens: 295,
+          total_tokens: 58657,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 112604,
+          output_tokens: 193,
+          total_tokens: 112797,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 257440,
+          output_tokens: 2217,
+          total_tokens: 259657,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
          model: 'claude-opus-4-5-20251101',
        },
      ];

-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 31596, output_tokens: 163 });
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      // input_tokens should be first entry's input (initial context)
+      expect(client.usage.input_tokens).toBe(31596);
+
+      // output_tokens should be sum of all model outputs: 151 + 150 + 295 + 193 + 2217 = 3006
+      // NOT the inflated value from incremental calculation (338,559)
+      expect(client.usage.output_tokens).toBe(3006);
+
+      // Verify spendTokens was called for each entry with correct values
+      expect(mockSpendTokens).toHaveBeenCalledTimes(5);
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        1,
+        expect.objectContaining({ model: 'claude-opus-4-5-20251101' }),
+        { promptTokens: 31596, completionTokens: 151 },
+      );
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        5,
+        expect.objectContaining({ model: 'claude-opus-4-5-20251101' }),
+        { promptTokens: 257440, completionTokens: 2217 },
+      );
+    });
+
+    it('should handle single followup message correctly', async () => {
+      // Real production data: followup to the above conversation
+      const collectedUsage = [
+        {
+          input_tokens: 263406,
+          output_tokens: 257,
+          total_tokens: 263663,
+          input_token_details: { cache_read: 0, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+      ];

      await client.recordCollectedUsage({
        collectedUsage,
@ -271,14 +327,300 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

+      expect(client.usage.input_tokens).toBe(263406);
+      expect(client.usage.output_tokens).toBe(257);
+
+      expect(mockSpendTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'claude-opus-4-5-20251101' }),
+        { promptTokens: 263406, completionTokens: 257 },
+      );
+    });
+
+    it('should ensure output_tokens > 0 check passes for BaseClient.sendMessage', async () => {
+      // This verifies the fix for the duplicate token spending bug
+      // BaseClient.sendMessage checks: if (usage != null && Number(usage[this.outputTokensKey]) > 0)
+      const collectedUsage = [
+        {
+          input_tokens: 31596,
+          output_tokens: 151,
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 35368,
+          output_tokens: 150,
+          model: 'claude-opus-4-5-20251101',
+        },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      const usage = client.getStreamUsage();
+
+      // The check that was failing before the fix
+      expect(usage).not.toBeNull();
+      expect(Number(usage.output_tokens)).toBeGreaterThan(0);
+
+      // Verify correct value
+      expect(usage.output_tokens).toBe(301); // 151 + 150
+    });
+
+    it('should correctly handle cache tokens with multiple tool calls', async () => {
+      // Real production data: Claude Opus with cache tokens (prompt caching)
+      // First entry has cache_creation, subsequent entries have cache_read
+      const collectedUsage = [
+        {
+          input_tokens: 788,
+          output_tokens: 163,
+          total_tokens: 951,
+          input_token_details: { cache_read: 0, cache_creation: 30808 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 3802,
+          output_tokens: 149,
+          total_tokens: 3951,
+          input_token_details: { cache_read: 30808, cache_creation: 768 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 26808,
+          output_tokens: 225,
+          total_tokens: 27033,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 80912,
+          output_tokens: 204,
+          total_tokens: 81116,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 136454,
+          output_tokens: 206,
+          total_tokens: 136660,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 146316,
+          output_tokens: 224,
+          total_tokens: 146540,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 150402,
+          output_tokens: 1248,
+          total_tokens: 151650,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 156268,
+          output_tokens: 139,
+          total_tokens: 156407,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+        {
+          input_tokens: 167126,
+          output_tokens: 2961,
+          total_tokens: 170087,
+          input_token_details: { cache_read: 31576, cache_creation: 0 },
+          model: 'claude-opus-4-5-20251101',
+        },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      // input_tokens = first entry's input + cache_creation + cache_read
+      // = 788 + 30808 + 0 = 31596
      expect(client.usage.input_tokens).toBe(31596);
-      expect(client.usage.output_tokens).toBe(163);
+
+      // output_tokens = sum of all output_tokens
+      // = 163 + 149 + 225 + 204 + 206 + 224 + 1248 + 139 + 2961 = 5519
+      expect(client.usage.output_tokens).toBe(5519);
+
+      // First 2 entries have cache tokens, should use spendStructuredTokens
+      // Remaining 7 entries have cache_read but no cache_creation, still structured
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(9);
+      expect(mockSpendTokens).toHaveBeenCalledTimes(0);
+
+      // Verify first entry uses structured tokens with cache_creation
+      expect(mockSpendStructuredTokens).toHaveBeenNthCalledWith(
+        1,
+        expect.objectContaining({ model: 'claude-opus-4-5-20251101' }),
+        {
+          promptTokens: { input: 788, write: 30808, read: 0 },
+          completionTokens: 163,
+        },
+      );
+
+      // Verify second entry uses structured tokens with both cache_creation and cache_read
+      expect(mockSpendStructuredTokens).toHaveBeenNthCalledWith(
+        2,
+        expect.objectContaining({ model: 'claude-opus-4-5-20251101' }),
+        {
+          promptTokens: { input: 3802, write: 768, read: 30808 },
+          completionTokens: 149,
+        },
+      );
+    });
+  });
+
+  describe('cache token handling', () => {
+    it('should handle OpenAI format cache tokens (input_token_details)', async () => {
+      const collectedUsage = [
+        {
+          input_tokens: 100,
+          output_tokens: 50,
+          model: 'gpt-4',
+          input_token_details: {
+            cache_creation: 20,
+            cache_read: 10,
+          },
+        },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendStructuredTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'gpt-4' }),
+        {
+          promptTokens: {
+            input: 100,
+            write: 20,
+            read: 10,
+          },
+          completionTokens: 50,
+        },
+      );
+    });
+
+    it('should handle Anthropic format cache tokens (cache_*_input_tokens)', async () => {
+      const collectedUsage = [
+        {
+          input_tokens: 100,
+          output_tokens: 50,
+          model: 'claude-3',
+          cache_creation_input_tokens: 25,
+          cache_read_input_tokens: 15,
+        },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendStructuredTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'claude-3' }),
+        {
+          promptTokens: {
+            input: 100,
+            write: 25,
+            read: 15,
+          },
+          completionTokens: 50,
+        },
+      );
+    });
+
+    it('should use spendTokens for entries without cache tokens', async () => {
+      const collectedUsage = [{ input_tokens: 100, output_tokens: 50, model: 'gpt-4' }];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendStructuredTokens).not.toHaveBeenCalled();
+    });
+
+    it('should handle mixed cache and non-cache entries', async () => {
+      const collectedUsage = [
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        {
+          input_tokens: 150,
+          output_tokens: 30,
+          model: 'gpt-4',
+          input_token_details: { cache_creation: 10, cache_read: 5 },
+        },
+        { input_tokens: 200, output_tokens: 20, model: 'gpt-4' },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+    });
+
+    it('should include cache tokens in total input calculation', async () => {
+      const collectedUsage = [
+        {
+          input_tokens: 100,
+          output_tokens: 50,
+          model: 'gpt-4',
+          input_token_details: {
+            cache_creation: 20,
+            cache_read: 10,
+          },
+        },
+      ];
+
+      await client.recordCollectedUsage({
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      // Total input should include cache tokens: 100 + 20 + 10 = 130
+      expect(client.usage.input_tokens).toBe(130);
    });
  });

  describe('model fallback', () => {
-    it('should use param model when available', async () => {
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
+    it('should use usage.model when available', async () => {
+      const collectedUsage = [{ input_tokens: 100, output_tokens: 50, model: 'gpt-4-turbo' }];
+
+      await client.recordCollectedUsage({
+        model: 'fallback-model',
+        collectedUsage,
+        balance: { enabled: true },
+        transactions: { enabled: true },
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'gpt-4-turbo' }),
+        expect.any(Object),
+      );
+    });
+
+    it('should fallback to param model when usage.model is missing', async () => {
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50 }];

      await client.recordCollectedUsage({
@ -288,13 +630,14 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

-      const [, params] = mockRecordCollectedUsage.mock.calls[0];
-      expect(params.model).toBe('param-model');
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'param-model' }),
+        expect.any(Object),
+      );
    });

    it('should fallback to client.model when param model is missing', async () => {
      client.model = 'client-model';
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50 }];

      await client.recordCollectedUsage({
@ -303,12 +646,13 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

-      const [, params] = mockRecordCollectedUsage.mock.calls[0];
-      expect(params.model).toBe('client-model');
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'client-model' }),
+        expect.any(Object),
+      );
    });

    it('should fallback to agent model_parameters.model as last resort', async () => {
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50 }];

      await client.recordCollectedUsage({
@ -317,14 +661,15 @@ describe('AgentClient - recordCollectedUsage', () => {
        transactions: { enabled: true },
      });

-      const [, params] = mockRecordCollectedUsage.mock.calls[0];
-      expect(params.model).toBe('gpt-4');
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'gpt-4' }),
+        expect.any(Object),
+      );
    });
  });

  describe('getStreamUsage integration', () => {
    it('should return the usage object set by recordCollectedUsage', async () => {
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50, model: 'gpt-4' }];

      await client.recordCollectedUsage({
@ -334,7 +679,10 @@ describe('AgentClient - recordCollectedUsage', () => {
      });

      const usage = client.getStreamUsage();
-      expect(usage).toEqual({ input_tokens: 100, output_tokens: 50 });
+      expect(usage).toEqual({
+        input_tokens: 100,
+        output_tokens: 50,
+      });
    });

    it('should return undefined before recordCollectedUsage is called', () => {
@ -342,9 +690,9 @@ describe('AgentClient - recordCollectedUsage', () => {
      expect(usage).toBeUndefined();
    });

-    /** Verifies usage passes the check in BaseClient.sendMessage: if (usage != null && Number(usage[this.outputTokensKey]) > 0) */
    it('should have output_tokens > 0 for BaseClient.sendMessage check', async () => {
-      mockRecordCollectedUsage.mockResolvedValue({ input_tokens: 200, output_tokens: 130 });
+      // This test verifies the usage will pass the check in BaseClient.sendMessage:
+      // if (usage != null && Number(usage[this.outputTokensKey]) > 0)
      const collectedUsage = [
        { input_tokens: 200, output_tokens: 100, model: 'gpt-4' },
        { input_tokens: 50, output_tokens: 30, model: 'gpt-4' },
--- a/api/server/controllers/agents/request.js
+++ b/api/server/controllers/agents/request.js
@ -3,9 +3,9 @@ const { Constants, ViolationTypes } = require('librechat-data-provider');
 const {
  sendEvent,
  getViolationInfo,
-  buildMessageFiles,
  GenerationJobManager,
  decrementPendingRequest,
+  sanitizeFileForTransmit,
  sanitizeMessageForTransmit,
  checkAndIncrementPendingRequest,
 } = require('@librechat/api');
@ -252,10 +252,13 @@ const ResumableAgentController = async (req, res, next, initializeClient, addTit
        conversation.title =
          conversation && !conversation.title ? null : conversation?.title || 'New Chat';

-        if (req.body.files && Array.isArray(client.options.attachments)) {
-          const files = buildMessageFiles(req.body.files, client.options.attachments);
-          if (files.length > 0) {
-            userMessage.files = files;
+        if (req.body.files && client.options?.attachments) {
+          userMessage.files = [];
+          const messageFiles = new Set(req.body.files.map((file) => file.file_id));
+          for (const attachment of client.options.attachments) {
+            if (messageFiles.has(attachment.file_id)) {
+              userMessage.files.push(sanitizeFileForTransmit(attachment));
+            }
          }
          delete userMessage.image_urls;
        }
@ -321,7 +324,7 @@ const ResumableAgentController = async (req, res, next, initializeClient, addTit
            conversationId: conversation?.conversationId,
          });

-          await GenerationJobManager.emitDone(streamId, finalEvent);
+          GenerationJobManager.emitDone(streamId, finalEvent);
          GenerationJobManager.completeJob(streamId);
          await decrementPendingRequest(userId);
        } else {
@ -341,7 +344,7 @@ const ResumableAgentController = async (req, res, next, initializeClient, addTit
            conversationId: conversation?.conversationId,
          });

-          await GenerationJobManager.emitDone(streamId, finalEvent);
+          GenerationJobManager.emitDone(streamId, finalEvent);
          GenerationJobManager.completeJob(streamId, 'Request aborted');
          await decrementPendingRequest(userId);
        }
@ -374,7 +377,7 @@ const ResumableAgentController = async (req, res, next, initializeClient, addTit
          // abortJob already handled emitDone and completeJob
        } else {
          logger.error(`[ResumableAgentController] Generation error for ${streamId}:`, error);
-          await GenerationJobManager.emitError(streamId, error.message || 'Generation failed');
+          GenerationJobManager.emitError(streamId, error.message || 'Generation failed');
          GenerationJobManager.completeJob(streamId, error.message);
        }

@ -403,7 +406,7 @@ const ResumableAgentController = async (req, res, next, initializeClient, addTit
      res.status(500).json({ error: error.message || 'Failed to start generation' });
    } else {
      // JSON already sent, emit error to stream so client can receive it
-      await GenerationJobManager.emitError(streamId, error.message || 'Failed to start generation');
+      GenerationJobManager.emitError(streamId, error.message || 'Failed to start generation');
    }
    GenerationJobManager.completeJob(streamId, error.message);
    await decrementPendingRequest(userId);
@ -636,10 +639,14 @@ const _LegacyAgentController = async (req, res, next, initializeClient, addTitle
    conversation.title =
      conversation && !conversation.title ? null : conversation?.title || 'New Chat';

-    if (req.body.files && Array.isArray(client.options.attachments)) {
-      const files = buildMessageFiles(req.body.files, client.options.attachments);
-      if (files.length > 0) {
-        userMessage.files = files;
+    // Process files if needed (sanitize to remove large text fields before transmission)
+    if (req.body.files && client.options?.attachments) {
+      userMessage.files = [];
+      const messageFiles = new Set(req.body.files.map((file) => file.file_id));
+      for (const attachment of client.options.attachments) {
+        if (messageFiles.has(attachment.file_id)) {
+          userMessage.files.push(sanitizeFileForTransmit(attachment));
+        }
      }
      delete userMessage.image_urls;
    }
--- a/api/server/controllers/agents/responses.js
+++ b/api/server/controllers/agents/responses.js
@ -1,912 +0,0 @@
-const { nanoid } = require('nanoid');
-const { v4: uuidv4 } = require('uuid');
-const { logger } = require('@librechat/data-schemas');
-const { Callback, ToolEndHandler, formatAgentMessages } = require('@librechat/agents');
-const { EModelEndpoint, ResourceType, PermissionBits } = require('librechat-data-provider');
-const {
-  createRun,
-  buildToolSet,
-  createSafeUser,
-  initializeAgent,
-  getBalanceConfig,
-  recordCollectedUsage,
-  getTransactionsConfig,
-  createToolExecuteHandler,
-  // Responses API
-  writeDone,
-  buildResponse,
-  generateResponseId,
-  isValidationFailure,
-  emitResponseCreated,
-  createResponseContext,
-  createResponseTracker,
-  setupStreamingResponse,
-  emitResponseInProgress,
-  convertInputToMessages,
-  validateResponseRequest,
-  buildAggregatedResponse,
-  createResponseAggregator,
-  sendResponsesErrorResponse,
-  createResponsesEventHandlers,
-  createAggregatorEventHandlers,
-} = require('@librechat/api');
-const {
-  createResponsesToolEndCallback,
-  createToolEndCallback,
-} = require('~/server/controllers/agents/callbacks');
-const { loadAgentTools, loadToolsForExecution } = require('~/server/services/ToolService');
-const { findAccessibleResources } = require('~/server/services/PermissionService');
-const { getConvoFiles, saveConvo, getConvo } = require('~/models/Conversation');
-const { spendTokens, spendStructuredTokens } = require('~/models/spendTokens');
-const { getMultiplier, getCacheMultiplier } = require('~/models/tx');
-const { getAgent, getAgents } = require('~/models/Agent');
-const db = require('~/models');
-
-/** @type {import('@librechat/api').AppConfig | null} */
-let appConfig = null;
-
-/**
- * Set the app config for the controller
- * @param {import('@librechat/api').AppConfig} config
- */
-function setAppConfig(config) {
-  appConfig = config;
-}
-
-/**
- * Creates a tool loader function for the agent.
- * @param {AbortSignal} signal - The abort signal
- * @param {boolean} [definitionsOnly=true] - When true, returns only serializable
- *   tool definitions without creating full tool instances (for event-driven mode)
- */
-function createToolLoader(signal, definitionsOnly = true) {
-  return async function loadTools({
-    req,
-    res,
-    tools,
-    model,
-    agentId,
-    provider,
-    tool_options,
-    tool_resources,
-  }) {
-    const agent = { id: agentId, tools, provider, model, tool_options };
-    try {
-      return await loadAgentTools({
-        req,
-        res,
-        agent,
-        signal,
-        tool_resources,
-        definitionsOnly,
-        streamId: null,
-      });
-    } catch (error) {
-      logger.error('Error loading tools for agent ' + agentId, error);
-    }
-  };
-}
-
-/**
- * Convert Open Responses input items to internal messages
- * @param {import('@librechat/api').InputItem[]} input
- * @returns {Array} Internal messages
- */
-function convertToInternalMessages(input) {
-  return convertInputToMessages(input);
-}
-
-/**
- * Load messages from a previous response/conversation
- * @param {string} conversationId - The conversation/response ID
- * @param {string} userId - The user ID
- * @returns {Promise<Array>} Messages from the conversation
- */
-async function loadPreviousMessages(conversationId, userId) {
-  try {
-    const messages = await db.getMessages({ conversationId, user: userId });
-    if (!messages || messages.length === 0) {
-      return [];
-    }
-
-    // Convert stored messages to internal format
-    return messages.map((msg) => {
-      const internalMsg = {
-        role: msg.isCreatedByUser ? 'user' : 'assistant',
-        content: '',
-        messageId: msg.messageId,
-      };
-
-      // Handle content - could be string or array
-      if (typeof msg.text === 'string') {
-        internalMsg.content = msg.text;
-      } else if (Array.isArray(msg.content)) {
-        // Handle content parts
-        internalMsg.content = msg.content;
-      } else if (msg.text) {
-        internalMsg.content = String(msg.text);
-      }
-
-      return internalMsg;
-    });
-  } catch (error) {
-    logger.error('[Responses API] Error loading previous messages:', error);
-    return [];
-  }
-}
-
-/**
- * Save input messages to database
- * @param {import('express').Request} req
- * @param {string} conversationId
- * @param {Array} inputMessages - Internal format messages
- * @param {string} agentId
- * @returns {Promise<void>}
- */
-async function saveInputMessages(req, conversationId, inputMessages, agentId) {
-  for (const msg of inputMessages) {
-    if (msg.role === 'user') {
-      await db.saveMessage(
-        req,
-        {
-          messageId: msg.messageId || nanoid(),
-          conversationId,
-          parentMessageId: null,
-          isCreatedByUser: true,
-          text: typeof msg.content === 'string' ? msg.content : JSON.stringify(msg.content),
-          sender: 'User',
-          endpoint: EModelEndpoint.agents,
-          model: agentId,
-        },
-        { context: 'Responses API - save user input' },
-      );
-    }
-  }
-}
-
-/**
- * Save response output to database
- * @param {import('express').Request} req
- * @param {string} conversationId
- * @param {string} responseId
- * @param {import('@librechat/api').Response} response
- * @param {string} agentId
- * @returns {Promise<void>}
- */
-async function saveResponseOutput(req, conversationId, responseId, response, agentId) {
-  // Extract text content from output items
-  let responseText = '';
-  for (const item of response.output) {
-    if (item.type === 'message' && item.content) {
-      for (const part of item.content) {
-        if (part.type === 'output_text' && part.text) {
-          responseText += part.text;
-        }
-      }
-    }
-  }
-
-  // Save the assistant message
-  await db.saveMessage(
-    req,
-    {
-      messageId: responseId,
-      conversationId,
-      parentMessageId: null,
-      isCreatedByUser: false,
-      text: responseText,
-      sender: 'Agent',
-      endpoint: EModelEndpoint.agents,
-      model: agentId,
-      finish_reason: response.status === 'completed' ? 'stop' : response.status,
-      tokenCount: response.usage?.output_tokens,
-    },
-    { context: 'Responses API - save assistant response' },
-  );
-}
-
-/**
- * Save or update conversation
- * @param {import('express').Request} req
- * @param {string} conversationId
- * @param {string} agentId
- * @param {object} agent
- * @returns {Promise<void>}
- */
-async function saveConversation(req, conversationId, agentId, agent) {
-  await saveConvo(
-    req,
-    {
-      conversationId,
-      endpoint: EModelEndpoint.agents,
-      agentId,
-      title: agent?.name || 'Open Responses Conversation',
-      model: agent?.model,
-    },
-    { context: 'Responses API - save conversation' },
-  );
-}
-
-/**
- * Convert stored messages to Open Responses output format
- * @param {Array} messages - Stored messages
- * @returns {Array} Output items
- */
-function convertMessagesToOutputItems(messages) {
-  const output = [];
-
-  for (const msg of messages) {
-    if (!msg.isCreatedByUser) {
-      output.push({
-        type: 'message',
-        id: msg.messageId,
-        role: 'assistant',
-        status: 'completed',
-        content: [
-          {
-            type: 'output_text',
-            text: msg.text || '',
-            annotations: [],
-          },
-        ],
-      });
-    }
-  }
-
-  return output;
-}
-
-/**
- * Create Response - POST /v1/responses
- *
- * Creates a model response following the Open Responses API specification.
- * Supports both streaming and non-streaming responses.
- *
- * @param {import('express').Request} req
- * @param {import('express').Response} res
- */
-const createResponse = async (req, res) => {
-  const requestStartTime = Date.now();
-
-  // Validate request
-  const validation = validateResponseRequest(req.body);
-  if (isValidationFailure(validation)) {
-    return sendResponsesErrorResponse(res, 400, validation.error);
-  }
-
-  const request = validation.request;
-  const agentId = request.model;
-  const isStreaming = request.stream === true;
-
-  // Look up the agent
-  const agent = await getAgent({ id: agentId });
-  if (!agent) {
-    return sendResponsesErrorResponse(
-      res,
-      404,
-      `Agent not found: ${agentId}`,
-      'not_found',
-      'model_not_found',
-    );
-  }
-
-  // Generate IDs
-  const responseId = generateResponseId();
-  const conversationId = request.previous_response_id ?? uuidv4();
-  const parentMessageId = null;
-
-  // Create response context
-  const context = createResponseContext(request, responseId);
-
-  logger.debug(
-    `[Responses API] Request ${responseId} started for agent ${agentId}, stream: ${isStreaming}`,
-  );
-
-  // Set up abort controller
-  const abortController = new AbortController();
-
-  // Handle client disconnect
-  req.on('close', () => {
-    if (!abortController.signal.aborted) {
-      abortController.abort();
-      logger.debug('[Responses API] Client disconnected, aborting');
-    }
-  });
-
-  try {
-    // Build allowed providers set
-    const allowedProviders = new Set(
-      appConfig?.endpoints?.[EModelEndpoint.agents]?.allowedProviders,
-    );
-
-    // Create tool loader
-    const loadTools = createToolLoader(abortController.signal);
-
-    // Initialize the agent first to check for disableStreaming
-    const endpointOption = {
-      endpoint: agent.provider,
-      model_parameters: agent.model_parameters ?? {},
-    };
-
-    const primaryConfig = await initializeAgent(
-      {
-        req,
-        res,
-        loadTools,
-        requestFiles: [],
-        conversationId,
-        parentMessageId,
-        agent,
-        endpointOption,
-        allowedProviders,
-        isInitialAgent: true,
-      },
-      {
-        getConvoFiles,
-        getFiles: db.getFiles,
-        getUserKey: db.getUserKey,
-        getMessages: db.getMessages,
-        updateFilesUsage: db.updateFilesUsage,
-        getUserKeyValues: db.getUserKeyValues,
-        getUserCodeFiles: db.getUserCodeFiles,
-        getToolFilesByIds: db.getToolFilesByIds,
-        getCodeGeneratedFiles: db.getCodeGeneratedFiles,
-      },
-    );
-
-    // Determine if streaming is enabled (check both request and agent config)
-    const streamingDisabled = !!primaryConfig.model_parameters?.disableStreaming;
-    const actuallyStreaming = isStreaming && !streamingDisabled;
-
-    // Load previous messages if previous_response_id is provided
-    let previousMessages = [];
-    if (request.previous_response_id) {
-      const userId = req.user?.id ?? 'api-user';
-      previousMessages = await loadPreviousMessages(request.previous_response_id, userId);
-    }
-
-    // Convert input to internal messages
-    const inputMessages = convertToInternalMessages(
-      typeof request.input === 'string' ? request.input : request.input,
-    );
-
-    // Merge previous messages with new input
-    const allMessages = [...previousMessages, ...inputMessages];
-
-    const toolSet = buildToolSet(primaryConfig);
-    const { messages: formattedMessages, indexTokenCountMap } = formatAgentMessages(
-      allMessages,
-      {},
-      toolSet,
-    );
-
-    // Create tracker for streaming or aggregator for non-streaming
-    const tracker = actuallyStreaming ? createResponseTracker() : null;
-    const aggregator = actuallyStreaming ? null : createResponseAggregator();
-
-    // Set up response for streaming
-    if (actuallyStreaming) {
-      setupStreamingResponse(res);
-
-      // Create handler config
-      const handlerConfig = {
-        res,
-        context,
-        tracker,
-      };
-
-      // Emit response.created then response.in_progress per Open Responses spec
-      emitResponseCreated(handlerConfig);
-      emitResponseInProgress(handlerConfig);
-
-      // Create event handlers
-      const { handlers: responsesHandlers, finalizeStream } =
-        createResponsesEventHandlers(handlerConfig);
-
-      // Collect usage for balance tracking
-      const collectedUsage = [];
-
-      // Artifact promises for processing tool outputs
-      /** @type {Promise<import('librechat-data-provider').TAttachment | null>[]} */
-      const artifactPromises = [];
-      // Use Responses API-specific callback that emits librechat:attachment events
-      const toolEndCallback = createResponsesToolEndCallback({
-        req,
-        res,
-        tracker,
-        artifactPromises,
-      });
-
-      // Create tool execute options for event-driven tool execution
-      const toolExecuteOptions = {
-        loadTools: async (toolNames) => {
-          return loadToolsForExecution({
-            req,
-            res,
-            agent,
-            toolNames,
-            signal: abortController.signal,
-            toolRegistry: primaryConfig.toolRegistry,
-            userMCPAuthMap: primaryConfig.userMCPAuthMap,
-            tool_resources: primaryConfig.tool_resources,
-            actionsEnabled: primaryConfig.actionsEnabled,
-          });
-        },
-        toolEndCallback,
-      };
-
-      // Combine handlers
-      const handlers = {
-        on_message_delta: responsesHandlers.on_message_delta,
-        on_reasoning_delta: responsesHandlers.on_reasoning_delta,
-        on_run_step: responsesHandlers.on_run_step,
-        on_run_step_delta: responsesHandlers.on_run_step_delta,
-        on_chat_model_end: {
-          handle: (event, data) => {
-            responsesHandlers.on_chat_model_end.handle(event, data);
-            const usage = data?.output?.usage_metadata;
-            if (usage) {
-              collectedUsage.push(usage);
-            }
-          },
-        },
-        on_tool_end: new ToolEndHandler(toolEndCallback, logger),
-        on_run_step_completed: { handle: () => {} },
-        on_chain_stream: { handle: () => {} },
-        on_chain_end: { handle: () => {} },
-        on_agent_update: { handle: () => {} },
-        on_custom_event: { handle: () => {} },
-        on_tool_execute: createToolExecuteHandler(toolExecuteOptions),
-      };
-
-      // Create and run the agent
-      const userId = req.user?.id ?? 'api-user';
-      const userMCPAuthMap = primaryConfig.userMCPAuthMap;
-
-      const run = await createRun({
-        agents: [primaryConfig],
-        messages: formattedMessages,
-        indexTokenCountMap,
-        runId: responseId,
-        signal: abortController.signal,
-        customHandlers: handlers,
-        requestBody: {
-          messageId: responseId,
-          conversationId,
-        },
-        user: { id: userId },
-      });
-
-      if (!run) {
-        throw new Error('Failed to create agent run');
-      }
-
-      // Process the stream
-      const config = {
-        runName: 'AgentRun',
-        configurable: {
-          thread_id: conversationId,
-          user_id: userId,
-          user: createSafeUser(req.user),
-          requestBody: {
-            messageId: responseId,
-            conversationId,
-          },
-          ...(userMCPAuthMap != null && { userMCPAuthMap }),
-        },
-        signal: abortController.signal,
-        streamMode: 'values',
-        version: 'v2',
-      };
-
-      await run.processStream({ messages: formattedMessages }, config, {
-        callbacks: {
-          [Callback.TOOL_ERROR]: (graph, error, toolId) => {
-            logger.error(`[Responses API] Tool Error "${toolId}"`, error);
-          },
-        },
-      });
-
-      // Record token usage against balance
-      const balanceConfig = getBalanceConfig(req.config);
-      const transactionsConfig = getTransactionsConfig(req.config);
-      recordCollectedUsage(
-        {
-          spendTokens,
-          spendStructuredTokens,
-          pricing: { getMultiplier, getCacheMultiplier },
-          bulkWriteOps: { insertMany: db.bulkInsertTransactions, updateBalance: db.updateBalance },
-        },
-        {
-          user: userId,
-          conversationId,
-          collectedUsage,
-          context: 'message',
-          messageId: responseId,
-          balance: balanceConfig,
-          transactions: transactionsConfig,
-          model: primaryConfig.model || agent.model_parameters?.model,
-        },
-      ).catch((err) => {
-        logger.error('[Responses API] Error recording usage:', err);
-      });
-
-      // Finalize the stream
-      finalizeStream();
-      res.end();
-
-      const duration = Date.now() - requestStartTime;
-      logger.debug(`[Responses API] Request ${responseId} completed in ${duration}ms (streaming)`);
-
-      // Save to database if store: true
-      if (request.store === true) {
-        try {
-          // Save conversation
-          await saveConversation(req, conversationId, agentId, agent);
-
-          // Save input messages
-          await saveInputMessages(req, conversationId, inputMessages, agentId);
-
-          // Build response for saving (use tracker with buildResponse for streaming)
-          const finalResponse = buildResponse(context, tracker, 'completed');
-          await saveResponseOutput(req, conversationId, responseId, finalResponse, agentId);
-
-          logger.debug(
-            `[Responses API] Stored response ${responseId} in conversation ${conversationId}`,
-          );
-        } catch (saveError) {
-          logger.error('[Responses API] Error saving response:', saveError);
-          // Don't fail the request if saving fails
-        }
-      }
-
-      // Wait for artifact processing after response ends (non-blocking)
-      if (artifactPromises.length > 0) {
-        Promise.all(artifactPromises).catch((artifactError) => {
-          logger.warn('[Responses API] Error processing artifacts:', artifactError);
-        });
-      }
-    } else {
-      const aggregatorHandlers = createAggregatorEventHandlers(aggregator);
-
-      // Collect usage for balance tracking
-      const collectedUsage = [];
-
-      /** @type {Promise<import('librechat-data-provider').TAttachment | null>[]} */
-      const artifactPromises = [];
-      const toolEndCallback = createToolEndCallback({ req, res, artifactPromises, streamId: null });
-
-      const toolExecuteOptions = {
-        loadTools: async (toolNames) => {
-          return loadToolsForExecution({
-            req,
-            res,
-            agent,
-            toolNames,
-            signal: abortController.signal,
-            toolRegistry: primaryConfig.toolRegistry,
-            userMCPAuthMap: primaryConfig.userMCPAuthMap,
-            tool_resources: primaryConfig.tool_resources,
-            actionsEnabled: primaryConfig.actionsEnabled,
-          });
-        },
-        toolEndCallback,
-      };
-
-      const handlers = {
-        on_message_delta: aggregatorHandlers.on_message_delta,
-        on_reasoning_delta: aggregatorHandlers.on_reasoning_delta,
-        on_run_step: aggregatorHandlers.on_run_step,
-        on_run_step_delta: aggregatorHandlers.on_run_step_delta,
-        on_chat_model_end: {
-          handle: (event, data) => {
-            aggregatorHandlers.on_chat_model_end.handle(event, data);
-            const usage = data?.output?.usage_metadata;
-            if (usage) {
-              collectedUsage.push(usage);
-            }
-          },
-        },
-        on_tool_end: new ToolEndHandler(toolEndCallback, logger),
-        on_run_step_completed: { handle: () => {} },
-        on_chain_stream: { handle: () => {} },
-        on_chain_end: { handle: () => {} },
-        on_agent_update: { handle: () => {} },
-        on_custom_event: { handle: () => {} },
-        on_tool_execute: createToolExecuteHandler(toolExecuteOptions),
-      };
-
-      const userId = req.user?.id ?? 'api-user';
-      const userMCPAuthMap = primaryConfig.userMCPAuthMap;
-
-      const run = await createRun({
-        agents: [primaryConfig],
-        messages: formattedMessages,
-        indexTokenCountMap,
-        runId: responseId,
-        signal: abortController.signal,
-        customHandlers: handlers,
-        requestBody: {
-          messageId: responseId,
-          conversationId,
-        },
-        user: { id: userId },
-      });
-
-      if (!run) {
-        throw new Error('Failed to create agent run');
-      }
-
-      const config = {
-        runName: 'AgentRun',
-        configurable: {
-          thread_id: conversationId,
-          user_id: userId,
-          user: createSafeUser(req.user),
-          requestBody: {
-            messageId: responseId,
-            conversationId,
-          },
-          ...(userMCPAuthMap != null && { userMCPAuthMap }),
-        },
-        signal: abortController.signal,
-        streamMode: 'values',
-        version: 'v2',
-      };
-
-      await run.processStream({ messages: formattedMessages }, config, {
-        callbacks: {
-          [Callback.TOOL_ERROR]: (graph, error, toolId) => {
-            logger.error(`[Responses API] Tool Error "${toolId}"`, error);
-          },
-        },
-      });
-
-      // Record token usage against balance
-      const balanceConfig = getBalanceConfig(req.config);
-      const transactionsConfig = getTransactionsConfig(req.config);
-      recordCollectedUsage(
-        {
-          spendTokens,
-          spendStructuredTokens,
-          pricing: { getMultiplier, getCacheMultiplier },
-          bulkWriteOps: { insertMany: db.bulkInsertTransactions, updateBalance: db.updateBalance },
-        },
-        {
-          user: userId,
-          conversationId,
-          collectedUsage,
-          context: 'message',
-          messageId: responseId,
-          balance: balanceConfig,
-          transactions: transactionsConfig,
-          model: primaryConfig.model || agent.model_parameters?.model,
-        },
-      ).catch((err) => {
-        logger.error('[Responses API] Error recording usage:', err);
-      });
-
-      if (artifactPromises.length > 0) {
-        try {
-          await Promise.all(artifactPromises);
-        } catch (artifactError) {
-          logger.warn('[Responses API] Error processing artifacts:', artifactError);
-        }
-      }
-
-      const response = buildAggregatedResponse(context, aggregator);
-
-      if (request.store === true) {
-        try {
-          await saveConversation(req, conversationId, agentId, agent);
-
-          await saveInputMessages(req, conversationId, inputMessages, agentId);
-
-          await saveResponseOutput(req, conversationId, responseId, response, agentId);
-
-          logger.debug(
-            `[Responses API] Stored response ${responseId} in conversation ${conversationId}`,
-          );
-        } catch (saveError) {
-          logger.error('[Responses API] Error saving response:', saveError);
-          // Don't fail the request if saving fails
-        }
-      }
-
-      res.json(response);
-
-      const duration = Date.now() - requestStartTime;
-      logger.debug(
-        `[Responses API] Request ${responseId} completed in ${duration}ms (non-streaming)`,
-      );
-    }
-  } catch (error) {
-    const errorMessage = error instanceof Error ? error.message : 'An error occurred';
-    logger.error('[Responses API] Error:', error);
-
-    // Check if we already started streaming (headers sent)
-    if (res.headersSent) {
-      // Headers already sent, write error event and close
-      writeDone(res);
-      res.end();
-    } else {
-      // Forward upstream provider status codes (e.g., Anthropic 400s) instead of masking as 500
-      const statusCode =
-        typeof error?.status === 'number' && error.status >= 400 && error.status < 600
-          ? error.status
-          : 500;
-      const errorType = statusCode >= 400 && statusCode < 500 ? 'invalid_request' : 'server_error';
-      sendResponsesErrorResponse(res, statusCode, errorMessage, errorType);
-    }
-  }
-};
-
-/**
- * List available agents as models - GET /v1/models (also works with /v1/responses/models)
- *
- * Returns a list of available agents the user has remote access to.
- *
- * @param {import('express').Request} req
- * @param {import('express').Response} res
- */
-const listModels = async (req, res) => {
-  try {
-    const userId = req.user?.id;
-    const userRole = req.user?.role;
-
-    if (!userId) {
-      return sendResponsesErrorResponse(res, 401, 'Authentication required', 'auth_error');
-    }
-
-    // Find agents the user has remote access to (VIEW permission on REMOTE_AGENT)
-    const accessibleAgentIds = await findAccessibleResources({
-      userId,
-      role: userRole,
-      resourceType: ResourceType.REMOTE_AGENT,
-      requiredPermissions: PermissionBits.VIEW,
-    });
-
-    // Get the accessible agents
-    let agents = [];
-    if (accessibleAgentIds.length > 0) {
-      agents = await getAgents({ _id: { $in: accessibleAgentIds } });
-    }
-
-    // Convert to models format
-    const models = agents.map((agent) => ({
-      id: agent.id,
-      object: 'model',
-      created: Math.floor(new Date(agent.createdAt).getTime() / 1000),
-      owned_by: agent.author ?? 'librechat',
-      // Additional metadata
-      name: agent.name,
-      description: agent.description,
-      provider: agent.provider,
-    }));
-
-    res.json({
-      object: 'list',
-      data: models,
-    });
-  } catch (error) {
-    logger.error('[Responses API] Error listing models:', error);
-    sendResponsesErrorResponse(
-      res,
-      500,
-      error instanceof Error ? error.message : 'Failed to list models',
-      'server_error',
-    );
-  }
-};
-
-/**
- * Get Response - GET /v1/responses/:id
- *
- * Retrieves a stored response by its ID.
- * The response ID maps to a conversationId in LibreChat's storage.
- *
- * @param {import('express').Request} req
- * @param {import('express').Response} res
- */
-const getResponse = async (req, res) => {
-  try {
-    const responseId = req.params.id;
-    const userId = req.user?.id;
-
-    if (!responseId) {
-      return sendResponsesErrorResponse(res, 400, 'Response ID is required');
-    }
-
-    // The responseId could be either the response ID or the conversation ID
-    // Try to find a conversation with this ID
-    const conversation = await getConvo(userId, responseId);
-
-    if (!conversation) {
-      return sendResponsesErrorResponse(
-        res,
-        404,
-        `Response not found: ${responseId}`,
-        'not_found',
-        'response_not_found',
-      );
-    }
-
-    // Load messages for this conversation
-    const messages = await db.getMessages({ conversationId: responseId, user: userId });
-
-    if (!messages || messages.length === 0) {
-      return sendResponsesErrorResponse(
-        res,
-        404,
-        `No messages found for response: ${responseId}`,
-        'not_found',
-        'response_not_found',
-      );
-    }
-
-    // Convert messages to Open Responses output format
-    const output = convertMessagesToOutputItems(messages);
-
-    // Find the last assistant message for usage info
-    const lastAssistantMessage = messages.filter((m) => !m.isCreatedByUser).pop();
-
-    // Build the response object
-    const response = {
-      id: responseId,
-      object: 'response',
-      created_at: Math.floor(new Date(conversation.createdAt || Date.now()).getTime() / 1000),
-      completed_at: Math.floor(new Date(conversation.updatedAt || Date.now()).getTime() / 1000),
-      status: 'completed',
-      incomplete_details: null,
-      model: conversation.agentId || conversation.model || 'unknown',
-      previous_response_id: null,
-      instructions: null,
-      output,
-      error: null,
-      tools: [],
-      tool_choice: 'auto',
-      truncation: 'disabled',
-      parallel_tool_calls: true,
-      text: { format: { type: 'text' } },
-      temperature: 1,
-      top_p: 1,
-      presence_penalty: 0,
-      frequency_penalty: 0,
-      top_logprobs: null,
-      reasoning: null,
-      user: userId,
-      usage: lastAssistantMessage?.tokenCount
-        ? {
-            input_tokens: 0,
-            output_tokens: lastAssistantMessage.tokenCount,
-            total_tokens: lastAssistantMessage.tokenCount,
-          }
-        : null,
-      max_output_tokens: null,
-      max_tool_calls: null,
-      store: true,
-      background: false,
-      service_tier: 'default',
-      metadata: {},
-      safety_identifier: null,
-      prompt_cache_key: null,
-    };
-
-    res.json(response);
-  } catch (error) {
-    logger.error('[Responses API] Error getting response:', error);
-    sendResponsesErrorResponse(
-      res,
-      500,
-      error instanceof Error ? error.message : 'Failed to get response',
-      'server_error',
-    );
-  }
-};
-
-module.exports = {
-  createResponse,
-  getResponse,
-  listModels,
-  setAppConfig,
-};
--- a/api/server/controllers/agents/v1.js
+++ b/api/server/controllers/agents/v1.js
@ -6,15 +6,12 @@ const {
  agentCreateSchema,
  agentUpdateSchema,
  refreshListAvatars,
-  collectEdgeAgentIds,
  mergeAgentOcrConversion,
  MAX_AVATAR_REFRESH_AGENTS,
  convertOcrToContextInPlace,
 } = require('@librechat/api');
 const {
-  Time,
  Tools,
-  CacheKeys,
  Constants,
  FileSources,
  ResourceType,
@ -24,6 +21,8 @@ const {
  PermissionBits,
  actionDelimiter,
  removeNullishValues,
+  CacheKeys,
+  Time,
 } = require('librechat-data-provider');
 const {
  getListAgentsByAccess,
@ -36,7 +35,6 @@ const {
 } = require('~/models/Agent');
 const {
  findPubliclyAccessibleResources,
-  getResourcePermissionsMap,
  findAccessibleResources,
  hasPublicPermission,
  grantPermission,
@ -49,7 +47,6 @@ const { refreshS3Url } = require('~/server/services/Files/S3/crud');
 const { filterFile } = require('~/server/services/Files/process');
 const { updateAction, getActions } = require('~/models/Action');
 const { getCachedTools } = require('~/server/services/Config');
-const { getMCPServersRegistry } = require('~/config');
 const { getLogStores } = require('~/cache');

 const systemTools = {
@ -61,116 +58,6 @@ const systemTools = {
 const MAX_SEARCH_LEN = 100;
 const escapeRegex = (str = '') => str.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');

-/**
- * Validates that the requesting user has VIEW access to every agent referenced in edges.
- * Agents that do not exist in the database are skipped — at create time, the `from` field
- * often references the agent being built, which has no DB record yet.
- * @param {import('librechat-data-provider').GraphEdge[]} edges
- * @param {string} userId
- * @param {string} userRole - Used for group/role principal resolution
- * @returns {Promise<string[]>} Agent IDs the user cannot VIEW (empty if all accessible)
- */
-const validateEdgeAgentAccess = async (edges, userId, userRole) => {
-  const edgeAgentIds = collectEdgeAgentIds(edges);
-  if (edgeAgentIds.size === 0) {
-    return [];
-  }
-
-  const agents = (await Promise.all([...edgeAgentIds].map((id) => getAgent({ id })))).filter(
-    Boolean,
-  );
-
-  if (agents.length === 0) {
-    return [];
-  }
-
-  const permissionsMap = await getResourcePermissionsMap({
-    userId,
-    role: userRole,
-    resourceType: ResourceType.AGENT,
-    resourceIds: agents.map((a) => a._id),
-  });
-
-  return agents
-    .filter((a) => {
-      const bits = permissionsMap.get(a._id.toString()) ?? 0;
-      return (bits & PermissionBits.VIEW) === 0;
-    })
-    .map((a) => a.id);
-};
-
-/**
- * Filters tools to only include those the user is authorized to use.
- * MCP tools must match the exact format `{toolName}_mcp_{serverName}` (exactly 2 segments).
- * Multi-delimiter keys are rejected to prevent authorization/execution mismatch.
- * Non-MCP tools must appear in availableTools (global tool cache) or systemTools.
- *
- * When `existingTools` is provided and the MCP registry is unavailable (e.g. server restart),
- * tools already present on the agent are preserved rather than stripped — they were validated
- * when originally added, and we cannot re-verify them without the registry.
- * @param {object} params
- * @param {string[]} params.tools - Raw tool strings from the request
- * @param {string} params.userId - Requesting user ID for MCP server access check
- * @param {Record<string, unknown>} params.availableTools - Global non-MCP tool cache
- * @param {string[]} [params.existingTools] - Tools already persisted on the agent document
- * @returns {Promise<string[]>} Only the authorized subset of tools
- */
-const filterAuthorizedTools = async ({ tools, userId, availableTools, existingTools }) => {
-  const filteredTools = [];
-  let mcpServerConfigs;
-  let registryUnavailable = false;
-  const existingToolSet = existingTools?.length ? new Set(existingTools) : null;
-
-  for (const tool of tools) {
-    if (availableTools[tool] || systemTools[tool]) {
-      filteredTools.push(tool);
-      continue;
-    }
-
-    if (!tool?.includes(Constants.mcp_delimiter)) {
-      continue;
-    }
-
-    if (mcpServerConfigs === undefined) {
-      try {
-        mcpServerConfigs = (await getMCPServersRegistry().getAllServerConfigs(userId)) ?? {};
-      } catch (e) {
-        logger.warn(
-          '[filterAuthorizedTools] MCP registry unavailable, filtering all MCP tools',
-          e.message,
-        );
-        mcpServerConfigs = {};
-        registryUnavailable = true;
-      }
-    }
-
-    const parts = tool.split(Constants.mcp_delimiter);
-    if (parts.length !== 2) {
-      logger.warn(
-        `[filterAuthorizedTools] Rejected malformed MCP tool key "${tool}" for user ${userId}`,
-      );
-      continue;
-    }
-
-    if (registryUnavailable && existingToolSet?.has(tool)) {
-      filteredTools.push(tool);
-      continue;
-    }
-
-    const [, serverName] = parts;
-    if (!serverName || !Object.hasOwn(mcpServerConfigs, serverName)) {
-      logger.warn(
-        `[filterAuthorizedTools] Rejected MCP tool "${tool}" — server "${serverName}" not accessible to user ${userId}`,
-      );
-      continue;
-    }
-
-    filteredTools.push(tool);
-  }
-
-  return filteredTools;
-};
-
 /**
 * Creates an Agent.
 * @route POST /Agents
@ -188,46 +75,35 @@ const createAgentHandler = async (req, res) => {
      agentData.model_parameters = removeNullishValues(agentData.model_parameters, true);
    }

-    const { id: userId, role: userRole } = req.user;
-
-    if (agentData.edges?.length) {
-      const unauthorized = await validateEdgeAgentAccess(agentData.edges, userId, userRole);
-      if (unauthorized.length > 0) {
-        return res.status(403).json({
-          error: 'You do not have access to one or more agents referenced in edges',
-          agent_ids: unauthorized,
-        });
-      }
-    }
+    const { id: userId } = req.user;

    agentData.id = `agent_${nanoid()}`;
    agentData.author = userId;
    agentData.tools = [];

    const availableTools = (await getCachedTools()) ?? {};
-    agentData.tools = await filterAuthorizedTools({ tools, userId, availableTools });
+    for (const tool of tools) {
+      if (availableTools[tool]) {
+        agentData.tools.push(tool);
+      } else if (systemTools[tool]) {
+        agentData.tools.push(tool);
+      } else if (tool.includes(Constants.mcp_delimiter)) {
+        agentData.tools.push(tool);
+      }
+    }

    const agent = await createAgent(agentData);

+    // Automatically grant owner permissions to the creator
    try {
-      await Promise.all([
-        grantPermission({
-          principalType: PrincipalType.USER,
-          principalId: userId,
-          resourceType: ResourceType.AGENT,
-          resourceId: agent._id,
-          accessRoleId: AccessRoleIds.AGENT_OWNER,
-          grantedBy: userId,
-        }),
-        grantPermission({
-          principalType: PrincipalType.USER,
-          principalId: userId,
-          resourceType: ResourceType.REMOTE_AGENT,
-          resourceId: agent._id,
-          accessRoleId: AccessRoleIds.REMOTE_AGENT_OWNER,
-          grantedBy: userId,
-        }),
-      ]);
+      await grantPermission({
+        principalType: PrincipalType.USER,
+        principalId: userId,
+        resourceType: ResourceType.AGENT,
+        resourceId: agent._id,
+        accessRoleId: AccessRoleIds.AGENT_OWNER,
+        grantedBy: userId,
+      });
      logger.debug(
        `[createAgent] Granted owner permissions to user ${userId} for agent ${agent.id}`,
      );
@ -358,17 +234,6 @@ const updateAgentHandler = async (req, res) => {
      updateData.avatar = avatarField;
    }

-    if (updateData.edges?.length) {
-      const { id: userId, role: userRole } = req.user;
-      const unauthorized = await validateEdgeAgentAccess(updateData.edges, userId, userRole);
-      if (unauthorized.length > 0) {
-        return res.status(403).json({
-          error: 'You do not have access to one or more agents referenced in edges',
-          agent_ids: unauthorized,
-        });
-      }
-    }
-
    // Convert OCR to context in incoming updateData
    convertOcrToContextInPlace(updateData);

@ -387,26 +252,6 @@ const updateAgentHandler = async (req, res) => {
      updateData.tools = ocrConversion.tools;
    }

-    if (updateData.tools) {
-      const existingToolSet = new Set(existingAgent.tools ?? []);
-      const newMCPTools = updateData.tools.filter(
-        (t) => !existingToolSet.has(t) && t?.includes(Constants.mcp_delimiter),
-      );
-
-      if (newMCPTools.length > 0) {
-        const availableTools = (await getCachedTools()) ?? {};
-        const approvedNew = await filterAuthorizedTools({
-          tools: newMCPTools,
-          userId: req.user.id,
-          availableTools,
-        });
-        const rejectedSet = new Set(newMCPTools.filter((t) => !approvedNew.includes(t)));
-        if (rejectedSet.size > 0) {
-          updateData.tools = updateData.tools.filter((t) => !rejectedSet.has(t));
-        }
-      }
-    }
-
    let updatedAgent =
      Object.keys(updateData).length > 0
        ? await updateAgent({ id }, updateData, {
@ -517,7 +362,7 @@ const duplicateAgentHandler = async (req, res) => {
     */
    const duplicateAction = async (action) => {
      const newActionId = nanoid();
-      const { domain } = action.metadata;
+      const [domain] = action.action_id.split(actionDelimiter);
      const fullActionId = `${domain}${actionDelimiter}${newActionId}`;

      // Sanitize sensitive metadata before persisting
@ -527,7 +372,7 @@ const duplicateAgentHandler = async (req, res) => {
      }

      const newAction = await updateAction(
-        { action_id: newActionId, agent_id: newAgentId },
+        { action_id: newActionId },
        {
          metadata: filteredMetadata,
          agent_id: newAgentId,
@ -549,38 +394,18 @@ const duplicateAgentHandler = async (req, res) => {

    const agentActions = await Promise.all(promises);
    newAgentData.actions = agentActions;
-
-    if (newAgentData.tools?.length) {
-      const availableTools = (await getCachedTools()) ?? {};
-      newAgentData.tools = await filterAuthorizedTools({
-        tools: newAgentData.tools,
-        userId,
-        availableTools,
-        existingTools: newAgentData.tools,
-      });
-    }
-
    const newAgent = await createAgent(newAgentData);

+    // Automatically grant owner permissions to the duplicator
    try {
-      await Promise.all([
-        grantPermission({
-          principalType: PrincipalType.USER,
-          principalId: userId,
-          resourceType: ResourceType.AGENT,
-          resourceId: newAgent._id,
-          accessRoleId: AccessRoleIds.AGENT_OWNER,
-          grantedBy: userId,
-        }),
-        grantPermission({
-          principalType: PrincipalType.USER,
-          principalId: userId,
-          resourceType: ResourceType.REMOTE_AGENT,
-          resourceId: newAgent._id,
-          accessRoleId: AccessRoleIds.REMOTE_AGENT_OWNER,
-          grantedBy: userId,
-        }),
-      ]);
+      await grantPermission({
+        principalType: PrincipalType.USER,
+        principalId: userId,
+        resourceType: ResourceType.AGENT,
+        resourceId: newAgent._id,
+        accessRoleId: AccessRoleIds.AGENT_OWNER,
+        grantedBy: userId,
+      });
      logger.debug(
        `[duplicateAgent] Granted owner permissions to user ${userId} for duplicated agent ${newAgent.id}`,
      );
@ -687,10 +512,10 @@ const getListAgentsHandler = async (req, res) => {
     */
    const cache = getLogStores(CacheKeys.S3_EXPIRY_INTERVAL);
    const refreshKey = `${userId}:agents_avatar_refresh`;
-    let cachedRefresh = await cache.get(refreshKey);
-    const isValidCachedRefresh =
-      cachedRefresh != null && typeof cachedRefresh === 'object' && cachedRefresh.urlCache != null;
-    if (!isValidCachedRefresh) {
+    const alreadyChecked = await cache.get(refreshKey);
+    if (alreadyChecked) {
+      logger.debug('[/Agents] S3 avatar refresh already checked, skipping');
+    } else {
      try {
        const fullList = await getListAgentsByAccess({
          accessibleIds,
@ -698,19 +523,16 @@ const getListAgentsHandler = async (req, res) => {
          limit: MAX_AVATAR_REFRESH_AGENTS,
          after: null,
        });
-        const { urlCache } = await refreshListAvatars({
+        await refreshListAvatars({
          agents: fullList?.data ?? [],
          userId,
          refreshS3Url,
          updateAgent,
        });
-        cachedRefresh = { urlCache };
-        await cache.set(refreshKey, cachedRefresh, Time.THIRTY_MINUTES);
+        await cache.set(refreshKey, true, Time.THIRTY_MINUTES);
      } catch (err) {
        logger.error('[/Agents] Error refreshing avatars for full list: %o', err);
      }
-    } else {
-      logger.debug('[/Agents] S3 avatar refresh already checked, skipping');
    }

    // Use the new ACL-aware function
@ -728,20 +550,11 @@ const getListAgentsHandler = async (req, res) => {

    const publicSet = new Set(publiclyAccessibleIds.map((oid) => oid.toString()));

-    const urlCache = cachedRefresh?.urlCache;
    data.data = agents.map((agent) => {
      try {
        if (agent?._id && publicSet.has(agent._id.toString())) {
          agent.isPublic = true;
        }
-        if (
-          urlCache &&
-          agent?.id &&
-          agent?.avatar?.source === FileSources.s3 &&
-          urlCache[agent.id]
-        ) {
-          agent.avatar = { ...agent.avatar, filepath: urlCache[agent.id] };
-        }
      } catch (e) {
        // Silently ignore mapping errors
        void e;
@ -827,14 +640,6 @@ const uploadAgentAvatarHandler = async (req, res) => {
    const updatedAgent = await updateAgent({ id: agent_id }, data, {
      updatingUserId: req.user.id,
    });
-
-    try {
-      const avatarCache = getLogStores(CacheKeys.S3_EXPIRY_INTERVAL);
-      await avatarCache.delete(`${req.user.id}:agents_avatar_refresh`);
-    } catch (cacheErr) {
-      logger.error('[/:agent_id/avatar] Error invalidating avatar refresh cache', cacheErr);
-    }
-
    res.status(201).json(updatedAgent);
  } catch (error) {
    const message = 'An error occurred while updating the Agent Avatar';
@ -888,24 +693,7 @@ const revertAgentVersionHandler = async (req, res) => {

    // Permissions are enforced via route middleware (ACL EDIT)

-    let updatedAgent = await revertAgentVersion({ id }, version_index);
-
-    if (updatedAgent.tools?.length) {
-      const availableTools = (await getCachedTools()) ?? {};
-      const filteredTools = await filterAuthorizedTools({
-        tools: updatedAgent.tools,
-        userId: req.user.id,
-        availableTools,
-        existingTools: updatedAgent.tools,
-      });
-      if (filteredTools.length !== updatedAgent.tools.length) {
-        updatedAgent = await updateAgent(
-          { id },
-          { tools: filteredTools },
-          { updatingUserId: req.user.id },
-        );
-      }
-    }
+    const updatedAgent = await revertAgentVersion({ id }, version_index);

    if (updatedAgent.author) {
      updatedAgent.author = updatedAgent.author.toString();
@ -973,5 +761,4 @@ module.exports = {
  uploadAgentAvatar: uploadAgentAvatarHandler,
  revertAgentVersion: revertAgentVersionHandler,
  getAgentCategories,
-  filterAuthorizedTools,
 };
--- a/api/server/controllers/agents/v1.spec.js
+++ b/api/server/controllers/agents/v1.spec.js
@ -2,7 +2,7 @@ const mongoose = require('mongoose');
 const { nanoid } = require('nanoid');
 const { v4: uuidv4 } = require('uuid');
 const { agentSchema } = require('@librechat/data-schemas');
-const { FileSources, PermissionBits } = require('librechat-data-provider');
+const { FileSources } = require('librechat-data-provider');
 const { MongoMemoryServer } = require('mongodb-memory-server');

 // Only mock the dependencies that are not database-related
@ -46,9 +46,9 @@ jest.mock('~/models/File', () => ({
 jest.mock('~/server/services/PermissionService', () => ({
  findAccessibleResources: jest.fn().mockResolvedValue([]),
  findPubliclyAccessibleResources: jest.fn().mockResolvedValue([]),
-  getResourcePermissionsMap: jest.fn().mockResolvedValue(new Map()),
  grantPermission: jest.fn(),
  hasPublicPermission: jest.fn().mockResolvedValue(false),
+  checkPermission: jest.fn().mockResolvedValue(true),
 }));

 jest.mock('~/models', () => ({
@ -59,7 +59,6 @@ jest.mock('~/models', () => ({
 const mockCache = {
  get: jest.fn(),
  set: jest.fn(),
-  delete: jest.fn(),
 };
 jest.mock('~/cache', () => ({
  getLogStores: jest.fn(() => mockCache),
@ -74,7 +73,6 @@ const {
 const {
  findAccessibleResources,
  findPubliclyAccessibleResources,
-  getResourcePermissionsMap,
 } = require('~/server/services/PermissionService');

 const { refreshS3Url } = require('~/server/services/Files/S3/crud');
@ -1311,7 +1309,7 @@ describe('Agent Controllers - Mass Assignment Protection', () => {
    });

    test('should skip avatar refresh if cache hit', async () => {
-      mockCache.get.mockResolvedValue({ urlCache: {} });
+      mockCache.get.mockResolvedValue(true);
      findAccessibleResources.mockResolvedValue([agentWithS3Avatar._id]);
      findPubliclyAccessibleResources.mockResolvedValue([]);

@ -1350,12 +1348,8 @@ describe('Agent Controllers - Mass Assignment Protection', () => {
      // Verify S3 URL was refreshed
      expect(refreshS3Url).toHaveBeenCalled();

-      // Verify cache was set with urlCache map, not a plain boolean
-      expect(mockCache.set).toHaveBeenCalledWith(
-        expect.any(String),
-        expect.objectContaining({ urlCache: expect.any(Object) }),
-        expect.any(Number),
-      );
+      // Verify cache was set
+      expect(mockCache.set).toHaveBeenCalled();

      // Verify response was returned
      expect(mockRes.json).toHaveBeenCalled();
@ -1569,191 +1563,5 @@ describe('Agent Controllers - Mass Assignment Protection', () => {
      // Verify that the handler completed successfully
      expect(mockRes.json).toHaveBeenCalled();
    });
-
-    test('should treat legacy boolean cache entry as a miss and run refresh', async () => {
-      // Simulate a cache entry written by the pre-fix code
-      mockCache.get.mockResolvedValue(true);
-      findAccessibleResources.mockResolvedValue([agentWithS3Avatar._id]);
-      findPubliclyAccessibleResources.mockResolvedValue([]);
-      refreshS3Url.mockResolvedValue('new-s3-path.jpg');
-
-      const mockReq = {
-        user: { id: userA.toString(), role: 'USER' },
-        query: {},
-      };
-      const mockRes = {
-        status: jest.fn().mockReturnThis(),
-        json: jest.fn().mockReturnThis(),
-      };
-
-      await getListAgentsHandler(mockReq, mockRes);
-
-      // Boolean true fails the shape guard, so refresh must run
-      expect(refreshS3Url).toHaveBeenCalled();
-      // Cache is overwritten with the proper format
-      expect(mockCache.set).toHaveBeenCalledWith(
-        expect.any(String),
-        expect.objectContaining({ urlCache: expect.any(Object) }),
-        expect.any(Number),
-      );
-    });
-
-    test('should apply cached urlCache filepath to paginated response on cache hit', async () => {
-      const agentId = agentWithS3Avatar.id;
-      const cachedUrl = 'cached-presigned-url.jpg';
-
-      mockCache.get.mockResolvedValue({ urlCache: { [agentId]: cachedUrl } });
-      findAccessibleResources.mockResolvedValue([agentWithS3Avatar._id]);
-      findPubliclyAccessibleResources.mockResolvedValue([]);
-
-      const mockReq = {
-        user: { id: userA.toString(), role: 'USER' },
-        query: {},
-      };
-      const mockRes = {
-        status: jest.fn().mockReturnThis(),
-        json: jest.fn().mockReturnThis(),
-      };
-
-      await getListAgentsHandler(mockReq, mockRes);
-
-      expect(refreshS3Url).not.toHaveBeenCalled();
-
-      const responseData = mockRes.json.mock.calls[0][0];
-      const agent = responseData.data.find((a) => a.id === agentId);
-      // Cached URL is served, not the stale DB value 'old-s3-path.jpg'
-      expect(agent.avatar.filepath).toBe(cachedUrl);
-    });
-
-    test('should preserve DB filepath for agents absent from urlCache on cache hit', async () => {
-      mockCache.get.mockResolvedValue({ urlCache: {} });
-      findAccessibleResources.mockResolvedValue([agentWithS3Avatar._id]);
-      findPubliclyAccessibleResources.mockResolvedValue([]);
-
-      const mockReq = {
-        user: { id: userA.toString(), role: 'USER' },
-        query: {},
-      };
-      const mockRes = {
-        status: jest.fn().mockReturnThis(),
-        json: jest.fn().mockReturnThis(),
-      };
-
-      await getListAgentsHandler(mockReq, mockRes);
-
-      expect(refreshS3Url).not.toHaveBeenCalled();
-
-      const responseData = mockRes.json.mock.calls[0][0];
-      const agent = responseData.data.find((a) => a.id === agentWithS3Avatar.id);
-      expect(agent.avatar.filepath).toBe('old-s3-path.jpg');
-    });
-  });
-
-  describe('Edge ACL validation', () => {
-    let targetAgent;
-
-    beforeEach(async () => {
-      targetAgent = await Agent.create({
-        id: `agent_${nanoid()}`,
-        author: new mongoose.Types.ObjectId().toString(),
-        name: 'Target Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        tools: [],
-      });
-    });
-
-    test('createAgentHandler should return 403 when user lacks VIEW on an edge-referenced agent', async () => {
-      const permMap = new Map();
-      getResourcePermissionsMap.mockResolvedValueOnce(permMap);
-
-      mockReq.body = {
-        name: 'Attacker Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        edges: [{ from: 'self_placeholder', to: targetAgent.id, edgeType: 'handoff' }],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(403);
-      const response = mockRes.json.mock.calls[0][0];
-      expect(response.agent_ids).toContain(targetAgent.id);
-    });
-
-    test('createAgentHandler should succeed when user has VIEW on all edge-referenced agents', async () => {
-      const permMap = new Map([[targetAgent._id.toString(), 1]]);
-      getResourcePermissionsMap.mockResolvedValueOnce(permMap);
-
-      mockReq.body = {
-        name: 'Legit Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        edges: [{ from: 'self_placeholder', to: targetAgent.id, edgeType: 'handoff' }],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-    });
-
-    test('createAgentHandler should allow edges referencing non-existent agents (self-reference at create time)', async () => {
-      mockReq.body = {
-        name: 'Self-Ref Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        edges: [{ from: 'agent_does_not_exist_yet', to: 'agent_also_new', edgeType: 'handoff' }],
-      };
-
-      await createAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(201);
-    });
-
-    test('updateAgentHandler should return 403 when user lacks VIEW on an edge-referenced agent', async () => {
-      const ownedAgent = await Agent.create({
-        id: `agent_${nanoid()}`,
-        author: mockReq.user.id,
-        name: 'Owned Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        tools: [],
-      });
-
-      const permMap = new Map([[ownedAgent._id.toString(), PermissionBits.VIEW]]);
-      getResourcePermissionsMap.mockResolvedValueOnce(permMap);
-
-      mockReq.params = { id: ownedAgent.id };
-      mockReq.body = {
-        edges: [{ from: ownedAgent.id, to: targetAgent.id, edgeType: 'handoff' }],
-      };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).toHaveBeenCalledWith(403);
-      const response = mockRes.json.mock.calls[0][0];
-      expect(response.agent_ids).toContain(targetAgent.id);
-      expect(response.agent_ids).not.toContain(ownedAgent.id);
-    });
-
-    test('updateAgentHandler should succeed when edges field is absent from payload', async () => {
-      const ownedAgent = await Agent.create({
-        id: `agent_${nanoid()}`,
-        author: mockReq.user.id,
-        name: 'Owned Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        tools: [],
-      });
-
-      mockReq.params = { id: ownedAgent.id };
-      mockReq.body = { name: 'Renamed Agent' };
-
-      await updateAgentHandler(mockReq, mockRes);
-
-      expect(mockRes.status).not.toHaveBeenCalledWith(403);
-      const response = mockRes.json.mock.calls[0][0];
-      expect(response.name).toBe('Renamed Agent');
-    });
  });
 });
--- a/api/server/controllers/auth/LogoutController.js
+++ b/api/server/controllers/auth/LogoutController.js
@ -8,16 +8,13 @@ const logoutController = async (req, res) => {
  const parsedCookies = req.headers.cookie ? cookies.parse(req.headers.cookie) : {};
  const isOpenIdUser = req.user?.openidId != null && req.user?.provider === 'openid';

-  /** For OpenID users, read tokens from session (with cookie fallback) */
+  /** For OpenID users, read refresh token from session; for others, use cookie */
  let refreshToken;
-  let idToken;
  if (isOpenIdUser && req.session?.openidTokens) {
    refreshToken = req.session.openidTokens.refreshToken;
-    idToken = req.session.openidTokens.idToken;
    delete req.session.openidTokens;
  }
  refreshToken = refreshToken || parsedCookies.refreshToken;
-  idToken = idToken || parsedCookies.openid_id_token;

  try {
    const logout = await logoutUser(req, refreshToken);
@ -25,7 +22,6 @@ const logoutController = async (req, res) => {

    res.clearCookie('refreshToken');
    res.clearCookie('openid_access_token');
-    res.clearCookie('openid_id_token');
    res.clearCookie('openid_user_id');
    res.clearCookie('token_provider');
    const response = { message };
@ -34,34 +30,21 @@ const logoutController = async (req, res) => {
      isEnabled(process.env.OPENID_USE_END_SESSION_ENDPOINT) &&
      process.env.OPENID_ISSUER
    ) {
-      let openIdConfig;
-      try {
-        openIdConfig = getOpenIdConfig();
-      } catch (err) {
-        logger.warn('[logoutController] OpenID config not available:', err.message);
-      }
-      if (openIdConfig) {
-        const endSessionEndpoint = openIdConfig.serverMetadata().end_session_endpoint;
+      const openIdConfig = getOpenIdConfig();
+      if (!openIdConfig) {
+        logger.warn(
+          '[logoutController] OpenID config not found. Please verify that the open id configuration and initialization are correct.',
+        );
+      } else {
+        const endSessionEndpoint = openIdConfig
+          ? openIdConfig.serverMetadata().end_session_endpoint
+          : null;
        if (endSessionEndpoint) {
          const endSessionUrl = new URL(endSessionEndpoint);
          /** Redirect back to app's login page after IdP logout */
          const postLogoutRedirectUri =
            process.env.OPENID_POST_LOGOUT_REDIRECT_URI || `${process.env.DOMAIN_CLIENT}/login`;
          endSessionUrl.searchParams.set('post_logout_redirect_uri', postLogoutRedirectUri);
-
-          /** Add id_token_hint (preferred) or client_id for OIDC spec compliance */
-          if (idToken) {
-            endSessionUrl.searchParams.set('id_token_hint', idToken);
-          } else if (process.env.OPENID_CLIENT_ID) {
-            endSessionUrl.searchParams.set('client_id', process.env.OPENID_CLIENT_ID);
-          } else {
-            logger.warn(
-              '[logoutController] Neither id_token_hint nor OPENID_CLIENT_ID is available. ' +
-                'To enable id_token_hint, set OPENID_REUSE_TOKENS=true. ' +
-                'The OIDC end-session request may be rejected by the identity provider.',
-            );
-          }
-
          response.redirect = endSessionUrl.toString();
        } else {
          logger.warn(
--- a/api/server/controllers/auth/LogoutController.spec.js
+++ b/api/server/controllers/auth/LogoutController.spec.js
@ -1,259 +0,0 @@
-const cookies = require('cookie');
-
-const mockLogoutUser = jest.fn();
-const mockLogger = { warn: jest.fn(), error: jest.fn() };
-const mockIsEnabled = jest.fn();
-const mockGetOpenIdConfig = jest.fn();
-
-jest.mock('cookie');
-jest.mock('@librechat/api', () => ({ isEnabled: (...args) => mockIsEnabled(...args) }));
-jest.mock('@librechat/data-schemas', () => ({ logger: mockLogger }));
-jest.mock('~/server/services/AuthService', () => ({
-  logoutUser: (...args) => mockLogoutUser(...args),
-}));
-jest.mock('~/strategies', () => ({ getOpenIdConfig: () => mockGetOpenIdConfig() }));
-
-const { logoutController } = require('./LogoutController');
-
-function buildReq(overrides = {}) {
-  return {
-    user: { _id: 'user1', openidId: 'oid1', provider: 'openid' },
-    headers: { cookie: 'refreshToken=rt1' },
-    session: {
-      openidTokens: { refreshToken: 'srt', idToken: 'small-id-token' },
-      destroy: jest.fn(),
-    },
-    ...overrides,
-  };
-}
-
-function buildRes() {
-  const res = {
-    status: jest.fn().mockReturnThis(),
-    send: jest.fn().mockReturnThis(),
-    json: jest.fn().mockReturnThis(),
-    clearCookie: jest.fn(),
-  };
-  return res;
-}
-
-const ORIGINAL_ENV = process.env;
-
-beforeEach(() => {
-  jest.clearAllMocks();
-  process.env = {
-    ...ORIGINAL_ENV,
-    OPENID_USE_END_SESSION_ENDPOINT: 'true',
-    OPENID_ISSUER: 'https://idp.example.com',
-    OPENID_CLIENT_ID: 'my-client-id',
-    DOMAIN_CLIENT: 'https://app.example.com',
-  };
-  cookies.parse.mockReturnValue({ refreshToken: 'cookie-rt' });
-  mockLogoutUser.mockResolvedValue({ status: 200, message: 'Logout successful' });
-  mockIsEnabled.mockReturnValue(true);
-  mockGetOpenIdConfig.mockReturnValue({
-    serverMetadata: () => ({
-      end_session_endpoint: 'https://idp.example.com/logout',
-    }),
-  });
-});
-
-afterAll(() => {
-  process.env = ORIGINAL_ENV;
-});
-
-describe('LogoutController', () => {
-  describe('id_token_hint from session', () => {
-    it('sets id_token_hint when session has idToken', async () => {
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toContain('id_token_hint=small-id-token');
-      expect(body.redirect).not.toContain('client_id=');
-    });
-  });
-
-  describe('id_token_hint from cookie fallback', () => {
-    it('uses cookie id_token when session has no tokens', async () => {
-      cookies.parse.mockReturnValue({
-        refreshToken: 'cookie-rt',
-        openid_id_token: 'cookie-id-token',
-      });
-      const req = buildReq({ session: { destroy: jest.fn() } });
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toContain('id_token_hint=cookie-id-token');
-    });
-  });
-
-  describe('client_id fallback', () => {
-    it('falls back to client_id when no idToken is available', async () => {
-      cookies.parse.mockReturnValue({ refreshToken: 'cookie-rt' });
-      const req = buildReq({ session: { destroy: jest.fn() } });
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toContain('client_id=my-client-id');
-      expect(body.redirect).not.toContain('id_token_hint=');
-    });
-
-    it('does not produce client_id=undefined when OPENID_CLIENT_ID is unset', async () => {
-      delete process.env.OPENID_CLIENT_ID;
-      cookies.parse.mockReturnValue({ refreshToken: 'cookie-rt' });
-      const req = buildReq({ session: { destroy: jest.fn() } });
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).not.toContain('client_id=');
-      expect(body.redirect).not.toContain('undefined');
-      expect(mockLogger.warn).toHaveBeenCalledWith(
-        expect.stringContaining('Neither id_token_hint nor OPENID_CLIENT_ID'),
-      );
-    });
-  });
-
-  describe('OPENID_USE_END_SESSION_ENDPOINT disabled', () => {
-    it('does not include redirect when disabled', async () => {
-      mockIsEnabled.mockReturnValue(false);
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toBeUndefined();
-    });
-  });
-
-  describe('OPENID_ISSUER unset', () => {
-    it('does not include redirect when OPENID_ISSUER is missing', async () => {
-      delete process.env.OPENID_ISSUER;
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toBeUndefined();
-    });
-  });
-
-  describe('non-OpenID user', () => {
-    it('does not include redirect for non-OpenID users', async () => {
-      const req = buildReq({
-        user: { _id: 'user1', provider: 'local' },
-      });
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toBeUndefined();
-    });
-  });
-
-  describe('post_logout_redirect_uri', () => {
-    it('uses OPENID_POST_LOGOUT_REDIRECT_URI when set', async () => {
-      process.env.OPENID_POST_LOGOUT_REDIRECT_URI = 'https://custom.example.com/logged-out';
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      const url = new URL(body.redirect);
-      expect(url.searchParams.get('post_logout_redirect_uri')).toBe(
-        'https://custom.example.com/logged-out',
-      );
-    });
-
-    it('defaults to DOMAIN_CLIENT/login when OPENID_POST_LOGOUT_REDIRECT_URI is unset', async () => {
-      delete process.env.OPENID_POST_LOGOUT_REDIRECT_URI;
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      const url = new URL(body.redirect);
-      expect(url.searchParams.get('post_logout_redirect_uri')).toBe(
-        'https://app.example.com/login',
-      );
-    });
-  });
-
-  describe('OpenID config not available', () => {
-    it('warns and returns no redirect when getOpenIdConfig throws', async () => {
-      mockGetOpenIdConfig.mockImplementation(() => {
-        throw new Error('OpenID configuration has not been initialized');
-      });
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toBeUndefined();
-      expect(mockLogger.warn).toHaveBeenCalledWith(
-        expect.stringContaining('OpenID config not available'),
-        'OpenID configuration has not been initialized',
-      );
-    });
-  });
-
-  describe('end_session_endpoint not in metadata', () => {
-    it('warns and returns no redirect when end_session_endpoint is missing', async () => {
-      mockGetOpenIdConfig.mockReturnValue({
-        serverMetadata: () => ({}),
-      });
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      const body = res.send.mock.calls[0][0];
-      expect(body.redirect).toBeUndefined();
-      expect(mockLogger.warn).toHaveBeenCalledWith(
-        expect.stringContaining('end_session_endpoint not found'),
-      );
-    });
-  });
-
-  describe('error handling', () => {
-    it('returns 500 on logoutUser error', async () => {
-      mockLogoutUser.mockRejectedValue(new Error('session error'));
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      expect(res.status).toHaveBeenCalledWith(500);
-      expect(res.json).toHaveBeenCalledWith({ message: 'session error' });
-    });
-  });
-
-  describe('cookie clearing', () => {
-    it('clears all auth cookies on successful logout', async () => {
-      const req = buildReq();
-      const res = buildRes();
-
-      await logoutController(req, res);
-
-      expect(res.clearCookie).toHaveBeenCalledWith('refreshToken');
-      expect(res.clearCookie).toHaveBeenCalledWith('openid_access_token');
-      expect(res.clearCookie).toHaveBeenCalledWith('openid_id_token');
-      expect(res.clearCookie).toHaveBeenCalledWith('openid_user_id');
-      expect(res.clearCookie).toHaveBeenCalledWith('token_provider');
-    });
-  });
-});
--- a/api/server/controllers/auth/oauth.js
+++ b/api/server/controllers/auth/oauth.js
@ -1,79 +0,0 @@
-const { CacheKeys } = require('librechat-data-provider');
-const { logger, DEFAULT_SESSION_EXPIRY } = require('@librechat/data-schemas');
-const {
-  isEnabled,
-  getAdminPanelUrl,
-  isAdminPanelRedirect,
-  generateAdminExchangeCode,
-} = require('@librechat/api');
-const { syncUserEntraGroupMemberships } = require('~/server/services/PermissionService');
-const { setAuthTokens, setOpenIDAuthTokens } = require('~/server/services/AuthService');
-const getLogStores = require('~/cache/getLogStores');
-const { checkBan } = require('~/server/middleware');
-const { generateToken } = require('~/models');
-
-const domains = {
-  client: process.env.DOMAIN_CLIENT,
-  server: process.env.DOMAIN_SERVER,
-};
-
-function createOAuthHandler(redirectUri = domains.client) {
-  /**
-   * A handler to process OAuth authentication results.
-   * @type {Function}
-   * @param {ServerRequest} req - Express request object.
-   * @param {ServerResponse} res - Express response object.
-   * @param {NextFunction} next - Express next middleware function.
-   */
-  return async (req, res, next) => {
-    try {
-      if (res.headersSent) {
-        return;
-      }
-
-      await checkBan(req, res);
-      if (req.banned) {
-        return;
-      }
-
-      /** Check if this is an admin panel redirect (cross-origin) */
-      if (isAdminPanelRedirect(redirectUri, getAdminPanelUrl(), domains.client)) {
-        /** For admin panel, generate exchange code instead of setting cookies */
-        const cache = getLogStores(CacheKeys.ADMIN_OAUTH_EXCHANGE);
-        const sessionExpiry = Number(process.env.SESSION_EXPIRY) || DEFAULT_SESSION_EXPIRY;
-        const token = await generateToken(req.user, sessionExpiry);
-
-        /** Get refresh token from tokenset for OpenID users */
-        const refreshToken =
-          req.user.tokenset?.refresh_token || req.user.federatedTokens?.refresh_token;
-
-        const exchangeCode = await generateAdminExchangeCode(cache, req.user, token, refreshToken);
-
-        const callbackUrl = new URL(redirectUri);
-        callbackUrl.searchParams.set('code', exchangeCode);
-        logger.info(`[OAuth] Admin panel redirect with exchange code for user: ${req.user.email}`);
-        return res.redirect(callbackUrl.toString());
-      }
-
-      /** Standard OAuth flow - set cookies and redirect */
-      if (
-        req.user &&
-        req.user.provider == 'openid' &&
-        isEnabled(process.env.OPENID_REUSE_TOKENS) === true
-      ) {
-        await syncUserEntraGroupMemberships(req.user, req.user.tokenset.access_token);
-        setOpenIDAuthTokens(req.user.tokenset, req, res, req.user._id.toString());
-      } else {
-        await setAuthTokens(req.user._id, res);
-      }
-      res.redirect(redirectUri);
-    } catch (err) {
-      logger.error('Error in setting authentication tokens:', err);
-      next(err);
-    }
-  };
-}
-
-module.exports = {
-  createOAuthHandler,
-};
--- a/api/server/controllers/mcp.js
+++ b/api/server/controllers/mcp.js
@ -7,11 +7,9 @@
 */
 const { logger } = require('@librechat/data-schemas');
 const {
-  MCPErrorCodes,
-  redactServerSecrets,
-  redactAllServerSecrets,
  isMCPDomainNotAllowedError,
  isMCPInspectionFailedError,
+  MCPErrorCodes,
 } = require('@librechat/api');
 const { Constants, MCPServerUserInputSchema } = require('librechat-data-provider');
 const { cacheMCPServerTools, getMCPServerTools } = require('~/server/services/Config');
@ -183,8 +181,10 @@ const getMCPServersList = async (req, res) => {
      return res.status(401).json({ message: 'Unauthorized' });
    }

+    // 2. Get all server configs from registry (YAML + DB)
    const serverConfigs = await getMCPServersRegistry().getAllServerConfigs(userId);
-    return res.json(redactAllServerSecrets(serverConfigs));
+
+    return res.json(serverConfigs);
  } catch (error) {
    logger.error('[getMCPServersList]', error);
    res.status(500).json({ error: error.message });
@ -215,7 +215,7 @@ const createMCPServerController = async (req, res) => {
    );
    res.status(201).json({
      serverName: result.serverName,
-      ...redactServerSecrets(result.config),
+      ...result.config,
    });
  } catch (error) {
    logger.error('[createMCPServer]', error);
@ -243,7 +243,7 @@ const getMCPServerById = async (req, res) => {
      return res.status(404).json({ message: 'MCP server not found' });
    }

-    res.status(200).json(redactServerSecrets(parsedConfig));
+    res.status(200).json(parsedConfig);
  } catch (error) {
    logger.error('[getMCPServerById]', error);
    res.status(500).json({ message: error.message });
@ -274,7 +274,7 @@ const updateMCPServerController = async (req, res) => {
      userId,
    );

-    res.status(200).json(redactServerSecrets(parsedConfig));
+    res.status(200).json(parsedConfig);
  } catch (error) {
    logger.error('[updateMCPServer]', error);
    const mcpErrorResponse = handleMCPError(error, res);
--- a/api/server/experimental.js
+++ b/api/server/experimental.js
@ -14,7 +14,6 @@ const { logger } = require('@librechat/data-schemas');
 const mongoSanitize = require('express-mongo-sanitize');
 const {
  isEnabled,
-  apiNotFound,
  ErrorController,
  performStartupChecks,
  handleJsonParseError,
@ -298,10 +297,8 @@ if (cluster.isMaster) {
    /** Routes */
    app.use('/oauth', routes.oauth);
    app.use('/api/auth', routes.auth);
-    app.use('/api/admin', routes.adminAuth);
    app.use('/api/actions', routes.actions);
    app.use('/api/keys', routes.keys);
-    app.use('/api/api-keys', routes.apiKeys);
    app.use('/api/user', routes.user);
    app.use('/api/search', routes.search);
    app.use('/api/messages', routes.messages);
@ -312,6 +309,7 @@ if (cluster.isMaster) {
    app.use('/api/endpoints', routes.endpoints);
    app.use('/api/balance', routes.balance);
    app.use('/api/models', routes.models);
+    app.use('/api/plugins', routes.plugins);
    app.use('/api/config', routes.config);
    app.use('/api/assistants', routes.assistants);
    app.use('/api/files', await routes.files.initialize());
@ -325,8 +323,8 @@ if (cluster.isMaster) {
    app.use('/api/tags', routes.tags);
    app.use('/api/mcp', routes.mcp);

-    /** 404 for unmatched API routes */
-    app.use('/api', apiNotFound);
+    /** Error handler */
+    app.use(ErrorController);

    /** SPA fallback - serve index.html for all unmatched routes */
    app.use((req, res) => {
@ -344,9 +342,6 @@ if (cluster.isMaster) {
      res.send(updatedIndexHtml);
    });

-    /** Error handler (must be last - Express identifies error middleware by its 4-arg signature) */
-    app.use(ErrorController);
-
    /** Start listening on shared port (cluster will distribute connections) */
    app.listen(port, host, async (err) => {
      if (err) {
--- a/api/server/index.js
+++ b/api/server/index.js
@ -12,14 +12,12 @@ const { logger } = require('@librechat/data-schemas');
 const mongoSanitize = require('express-mongo-sanitize');
 const {
  isEnabled,
-  apiNotFound,
  ErrorController,
-  memoryDiagnostics,
  performStartupChecks,
  handleJsonParseError,
+  initializeFileStorage,
  GenerationJobManager,
  createStreamServices,
-  initializeFileStorage,
 } = require('@librechat/api');
 const { connectDb, indexSync } = require('~/db');
 const initializeOAuthReconnectManager = require('./services/initializeOAuthReconnectManager');
@ -136,10 +134,8 @@ const startServer = async () => {
  app.use('/oauth', routes.oauth);
  /* API Endpoints */
  app.use('/api/auth', routes.auth);
-  app.use('/api/admin', routes.adminAuth);
  app.use('/api/actions', routes.actions);
  app.use('/api/keys', routes.keys);
-  app.use('/api/api-keys', routes.apiKeys);
  app.use('/api/user', routes.user);
  app.use('/api/search', routes.search);
  app.use('/api/messages', routes.messages);
@ -164,10 +160,8 @@ const startServer = async () => {
  app.use('/api/tags', routes.tags);
  app.use('/api/mcp', routes.mcp);

-  /** 404 for unmatched API routes */
-  app.use('/api', apiNotFound);
+  app.use(ErrorController);

-  /** SPA fallback - serve index.html for all unmatched routes */
  app.use((req, res) => {
    res.set({
      'Cache-Control': process.env.INDEX_CACHE_CONTROL || 'no-cache, no-store, must-revalidate',
@ -183,9 +177,6 @@ const startServer = async () => {
    res.send(updatedIndexHtml);
  });

-  /** Error handler (must be last - Express identifies error middleware by its 4-arg signature) */
-  app.use(ErrorController);
-
  app.listen(port, host, async (err) => {
    if (err) {
      logger.error('Failed to start server:', err);
@ -208,11 +199,6 @@ const startServer = async () => {
    const streamServices = createStreamServices();
    GenerationJobManager.configure(streamServices);
    GenerationJobManager.initialize();
-
-    const inspectFlags = process.execArgv.some((arg) => arg.startsWith('--inspect'));
-    if (inspectFlags || isEnabled(process.env.MEM_DIAG)) {
-      memoryDiagnostics.start();
-    }
  });
 };

@ -263,15 +249,6 @@ process.on('uncaughtException', (err) => {
    return;
  }

-  if (isEnabled(process.env.CONTINUE_ON_UNCAUGHT_EXCEPTION)) {
-    logger.error('Unhandled error encountered. The app will continue running.', {
-      name: err?.name,
-      message: err?.message,
-      stack: err?.stack,
-    });
-    return;
-  }
-
  process.exit(1);
 });

--- a/api/server/index.spec.js
+++ b/api/server/index.spec.js
@ -100,40 +100,6 @@ describe('Server Configuration', () => {
    expect(response.headers['expires']).toBe('0');
  });

-  it('should return 404 JSON for undefined API routes', async () => {
-    const response = await request(app).get('/api/nonexistent');
-    expect(response.status).toBe(404);
-    expect(response.body).toEqual({ message: 'Endpoint not found' });
-  });
-
-  it('should return 404 JSON for nested undefined API routes', async () => {
-    const response = await request(app).get('/api/nonexistent/nested/path');
-    expect(response.status).toBe(404);
-    expect(response.body).toEqual({ message: 'Endpoint not found' });
-  });
-
-  it('should return 404 JSON for non-GET methods on undefined API routes', async () => {
-    const post = await request(app).post('/api/nonexistent');
-    expect(post.status).toBe(404);
-    expect(post.body).toEqual({ message: 'Endpoint not found' });
-
-    const del = await request(app).delete('/api/nonexistent');
-    expect(del.status).toBe(404);
-    expect(del.body).toEqual({ message: 'Endpoint not found' });
-  });
-
-  it('should return 404 JSON for the /api root path', async () => {
-    const response = await request(app).get('/api');
-    expect(response.status).toBe(404);
-    expect(response.body).toEqual({ message: 'Endpoint not found' });
-  });
-
-  it('should serve SPA HTML for non-API unmatched routes', async () => {
-    const response = await request(app).get('/this/does/not/exist');
-    expect(response.status).toBe(200);
-    expect(response.headers['content-type']).toMatch(/html/);
-  });
-
  it('should return 500 for unknown errors via ErrorController', async () => {
    // Testing the error handling here on top of unit tests to ensure the middleware is correctly integrated

--- a/api/server/middleware/abortMiddleware.js
+++ b/api/server/middleware/abortMiddleware.js
@ -1,19 +1,17 @@
 const { logger } = require('@librechat/data-schemas');
 const {
+  countTokens,
  isEnabled,
  sendEvent,
-  countTokens,
  GenerationJobManager,
-  recordCollectedUsage,
  sanitizeMessageForTransmit,
 } = require('@librechat/api');
 const { isAssistantsEndpoint, ErrorTypes } = require('librechat-data-provider');
-const { saveMessage, getConvo, updateBalance, bulkInsertTransactions } = require('~/models');
 const { spendTokens, spendStructuredTokens } = require('~/models/spendTokens');
 const { truncateText, smartTruncateText } = require('~/app/clients/prompts');
-const { getMultiplier, getCacheMultiplier } = require('~/models/tx');
 const clearPendingReq = require('~/cache/clearPendingReq');
 const { sendError } = require('~/server/middleware/error');
+const { saveMessage, getConvo } = require('~/models');
 const { abortRun } = require('./abortRun');

 /**
@ -29,35 +27,62 @@ const { abortRun } = require('./abortRun');
 * @param {string} params.conversationId - Conversation ID
 * @param {Array<Object>} params.collectedUsage - Usage metadata from all models
 * @param {string} [params.fallbackModel] - Fallback model name if not in usage
- * @param {string} [params.messageId] - The response message ID for transaction correlation
 */
-async function spendCollectedUsage({
-  userId,
-  conversationId,
-  collectedUsage,
-  fallbackModel,
-  messageId,
-}) {
+async function spendCollectedUsage({ userId, conversationId, collectedUsage, fallbackModel }) {
  if (!collectedUsage || collectedUsage.length === 0) {
    return;
  }

-  await recordCollectedUsage(
-    {
-      spendTokens,
-      spendStructuredTokens,
-      pricing: { getMultiplier, getCacheMultiplier },
-      bulkWriteOps: { insertMany: bulkInsertTransactions, updateBalance },
-    },
-    {
-      user: userId,
-      conversationId,
-      collectedUsage,
+  const spendPromises = [];
+
+  for (const usage of collectedUsage) {
+    if (!usage) {
+      continue;
+    }
+
+    // Support both OpenAI format (input_token_details) and Anthropic format (cache_*_input_tokens)
+    const cache_creation =
+      Number(usage.input_token_details?.cache_creation) ||
+      Number(usage.cache_creation_input_tokens) ||
+      0;
+    const cache_read =
+      Number(usage.input_token_details?.cache_read) || Number(usage.cache_read_input_tokens) || 0;
+
+    const txMetadata = {
      context: 'abort',
-      messageId,
-      model: fallbackModel,
-    },
-  );
+      conversationId,
+      user: userId,
+      model: usage.model ?? fallbackModel,
+    };
+
+    if (cache_creation > 0 || cache_read > 0) {
+      spendPromises.push(
+        spendStructuredTokens(txMetadata, {
+          promptTokens: {
+            input: usage.input_tokens,
+            write: cache_creation,
+            read: cache_read,
+          },
+          completionTokens: usage.output_tokens,
+        }).catch((err) => {
+          logger.error('[abortMiddleware] Error spending structured tokens for abort', err);
+        }),
+      );
+      continue;
+    }
+
+    spendPromises.push(
+      spendTokens(txMetadata, {
+        promptTokens: usage.input_tokens,
+        completionTokens: usage.output_tokens,
+      }).catch((err) => {
+        logger.error('[abortMiddleware] Error spending tokens for abort', err);
+      }),
+    );
+  }
+
+  // Wait for all token spending to complete
+  await Promise.all(spendPromises);

  // Clear the array to prevent double-spending from the AgentClient finally block.
  // The collectedUsage array is shared by reference with AgentClient.collectedUsage,
@ -119,7 +144,6 @@ async function abortMessage(req, res) {
      conversationId: jobData?.conversationId,
      collectedUsage,
      fallbackModel: jobData?.model,
-      messageId: jobData?.responseMessageId,
    });
  } else {
    // Fallback: no collected usage, use text-based token counting for primary model only
@ -268,5 +292,4 @@ const handleAbortError = async (res, req, error, data) => {
 module.exports = {
  handleAbort,
  handleAbortError,
-  spendCollectedUsage,
 };
--- a/api/server/middleware/abortMiddleware.spec.js
+++ b/api/server/middleware/abortMiddleware.spec.js
@ -4,32 +4,16 @@
 * This tests the token spending logic for abort scenarios,
 * particularly for parallel agents (addedConvo) where multiple
 * models need their tokens spent.
- *
- * spendCollectedUsage delegates to recordCollectedUsage from @librechat/api,
- * passing pricing + bulkWriteOps deps, with context: 'abort'.
- * After spending, it clears the collectedUsage array to prevent double-spending
- * from the AgentClient finally block (which shares the same array reference).
 */

 const mockSpendTokens = jest.fn().mockResolvedValue();
 const mockSpendStructuredTokens = jest.fn().mockResolvedValue();
-const mockRecordCollectedUsage = jest
-  .fn()
-  .mockResolvedValue({ input_tokens: 100, output_tokens: 50 });
-
-const mockGetMultiplier = jest.fn().mockReturnValue(1);
-const mockGetCacheMultiplier = jest.fn().mockReturnValue(null);

 jest.mock('~/models/spendTokens', () => ({
  spendTokens: (...args) => mockSpendTokens(...args),
  spendStructuredTokens: (...args) => mockSpendStructuredTokens(...args),
 }));

-jest.mock('~/models/tx', () => ({
-  getMultiplier: mockGetMultiplier,
-  getCacheMultiplier: mockGetCacheMultiplier,
-}));
-
 jest.mock('@librechat/data-schemas', () => ({
  logger: {
    debug: jest.fn(),
@ -46,7 +30,6 @@ jest.mock('@librechat/api', () => ({
  GenerationJobManager: {
    abortJob: jest.fn(),
  },
-  recordCollectedUsage: mockRecordCollectedUsage,
  sanitizeMessageForTransmit: jest.fn((msg) => msg),
 }));

@ -66,27 +49,94 @@ jest.mock('~/server/middleware/error', () => ({
  sendError: jest.fn(),
 }));

-const mockUpdateBalance = jest.fn().mockResolvedValue({});
-const mockBulkInsertTransactions = jest.fn().mockResolvedValue(undefined);
 jest.mock('~/models', () => ({
  saveMessage: jest.fn().mockResolvedValue(),
  getConvo: jest.fn().mockResolvedValue({ title: 'Test Chat' }),
-  updateBalance: mockUpdateBalance,
-  bulkInsertTransactions: mockBulkInsertTransactions,
 }));

 jest.mock('./abortRun', () => ({
  abortRun: jest.fn(),
 }));

-const { spendCollectedUsage } = require('./abortMiddleware');
+// Import the module after mocks are set up
+// We need to extract the spendCollectedUsage function for testing
+// Since it's not exported, we'll test it through the handleAbort flow

 describe('abortMiddleware - spendCollectedUsage', () => {
  beforeEach(() => {
    jest.clearAllMocks();
  });

-  describe('spendCollectedUsage delegation', () => {
+  describe('spendCollectedUsage logic', () => {
+    // Since spendCollectedUsage is not exported, we test the logic directly
+    // by replicating the function here for unit testing
+
+    const spendCollectedUsage = async ({
+      userId,
+      conversationId,
+      collectedUsage,
+      fallbackModel,
+    }) => {
+      if (!collectedUsage || collectedUsage.length === 0) {
+        return;
+      }
+
+      const spendPromises = [];
+
+      for (const usage of collectedUsage) {
+        if (!usage) {
+          continue;
+        }
+
+        const cache_creation =
+          Number(usage.input_token_details?.cache_creation) ||
+          Number(usage.cache_creation_input_tokens) ||
+          0;
+        const cache_read =
+          Number(usage.input_token_details?.cache_read) ||
+          Number(usage.cache_read_input_tokens) ||
+          0;
+
+        const txMetadata = {
+          context: 'abort',
+          conversationId,
+          user: userId,
+          model: usage.model ?? fallbackModel,
+        };
+
+        if (cache_creation > 0 || cache_read > 0) {
+          spendPromises.push(
+            mockSpendStructuredTokens(txMetadata, {
+              promptTokens: {
+                input: usage.input_tokens,
+                write: cache_creation,
+                read: cache_read,
+              },
+              completionTokens: usage.output_tokens,
+            }).catch(() => {
+              // Log error but don't throw
+            }),
+          );
+          continue;
+        }
+
+        spendPromises.push(
+          mockSpendTokens(txMetadata, {
+            promptTokens: usage.input_tokens,
+            completionTokens: usage.output_tokens,
+          }).catch(() => {
+            // Log error but don't throw
+          }),
+        );
+      }
+
+      // Wait for all token spending to complete
+      await Promise.all(spendPromises);
+
+      // Clear the array to prevent double-spending
+      collectedUsage.length = 0;
+    };
+
    it('should return early if collectedUsage is empty', async () => {
      await spendCollectedUsage({
        userId: 'user-123',
@ -95,7 +145,8 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gpt-4',
      });

-      expect(mockRecordCollectedUsage).not.toHaveBeenCalled();
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(mockSpendStructuredTokens).not.toHaveBeenCalled();
    });

    it('should return early if collectedUsage is null', async () => {
@ -106,10 +157,28 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gpt-4',
      });

-      expect(mockRecordCollectedUsage).not.toHaveBeenCalled();
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(mockSpendStructuredTokens).not.toHaveBeenCalled();
    });

-    it('should call recordCollectedUsage with abort context and full deps', async () => {
+    it('should skip null entries in collectedUsage', async () => {
+      const collectedUsage = [
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        null,
+        { input_tokens: 200, output_tokens: 60, model: 'gpt-4' },
+      ];
+
+      await spendCollectedUsage({
+        userId: 'user-123',
+        conversationId: 'convo-123',
+        collectedUsage,
+        fallbackModel: 'gpt-4',
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+    });
+
+    it('should spend tokens for single model', async () => {
      const collectedUsage = [{ input_tokens: 100, output_tokens: 50, model: 'gpt-4' }];

      await spendCollectedUsage({
@ -117,35 +186,21 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        conversationId: 'convo-123',
        collectedUsage,
        fallbackModel: 'gpt-4',
-        messageId: 'msg-123',
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        {
-          spendTokens: expect.any(Function),
-          spendStructuredTokens: expect.any(Function),
-          pricing: {
-            getMultiplier: mockGetMultiplier,
-            getCacheMultiplier: mockGetCacheMultiplier,
-          },
-          bulkWriteOps: {
-            insertMany: mockBulkInsertTransactions,
-            updateBalance: mockUpdateBalance,
-          },
-        },
-        {
-          user: 'user-123',
-          conversationId: 'convo-123',
-          collectedUsage,
+      expect(mockSpendTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({
          context: 'abort',
-          messageId: 'msg-123',
+          conversationId: 'convo-123',
+          user: 'user-123',
          model: 'gpt-4',
-        },
+        }),
+        { promptTokens: 100, completionTokens: 50 },
      );
    });

-    it('should pass context abort for multiple models (parallel agents)', async () => {
+    it('should spend tokens for multiple models (parallel agents)', async () => {
      const collectedUsage = [
        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
        { input_tokens: 80, output_tokens: 40, model: 'claude-3' },
@ -159,17 +214,136 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gpt-4',
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          context: 'abort',
-          collectedUsage,
-        }),
+      expect(mockSpendTokens).toHaveBeenCalledTimes(3);
+
+      // Verify each model was called
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        1,
+        expect.objectContaining({ model: 'gpt-4' }),
+        { promptTokens: 100, completionTokens: 50 },
+      );
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        2,
+        expect.objectContaining({ model: 'claude-3' }),
+        { promptTokens: 80, completionTokens: 40 },
+      );
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        3,
+        expect.objectContaining({ model: 'gemini-pro' }),
+        { promptTokens: 120, completionTokens: 60 },
      );
    });

+    it('should use fallbackModel when usage.model is missing', async () => {
+      const collectedUsage = [{ input_tokens: 100, output_tokens: 50 }];
+
+      await spendCollectedUsage({
+        userId: 'user-123',
+        conversationId: 'convo-123',
+        collectedUsage,
+        fallbackModel: 'fallback-model',
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'fallback-model' }),
+        expect.any(Object),
+      );
+    });
+
+    it('should use spendStructuredTokens for OpenAI format cache tokens', async () => {
+      const collectedUsage = [
+        {
+          input_tokens: 100,
+          output_tokens: 50,
+          model: 'gpt-4',
+          input_token_details: {
+            cache_creation: 20,
+            cache_read: 10,
+          },
+        },
+      ];
+
+      await spendCollectedUsage({
+        userId: 'user-123',
+        conversationId: 'convo-123',
+        collectedUsage,
+        fallbackModel: 'gpt-4',
+      });
+
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(mockSpendStructuredTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'gpt-4', context: 'abort' }),
+        {
+          promptTokens: {
+            input: 100,
+            write: 20,
+            read: 10,
+          },
+          completionTokens: 50,
+        },
+      );
+    });
+
+    it('should use spendStructuredTokens for Anthropic format cache tokens', async () => {
+      const collectedUsage = [
+        {
+          input_tokens: 100,
+          output_tokens: 50,
+          model: 'claude-3',
+          cache_creation_input_tokens: 25,
+          cache_read_input_tokens: 15,
+        },
+      ];
+
+      await spendCollectedUsage({
+        userId: 'user-123',
+        conversationId: 'convo-123',
+        collectedUsage,
+        fallbackModel: 'claude-3',
+      });
+
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).not.toHaveBeenCalled();
+      expect(mockSpendStructuredTokens).toHaveBeenCalledWith(
+        expect.objectContaining({ model: 'claude-3' }),
+        {
+          promptTokens: {
+            input: 100,
+            write: 25,
+            read: 15,
+          },
+          completionTokens: 50,
+        },
+      );
+    });
+
+    it('should handle mixed cache and non-cache entries', async () => {
+      const collectedUsage = [
+        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
+        {
+          input_tokens: 150,
+          output_tokens: 30,
+          model: 'claude-3',
+          cache_creation_input_tokens: 20,
+          cache_read_input_tokens: 10,
+        },
+        { input_tokens: 200, output_tokens: 20, model: 'gemini-pro' },
+      ];
+
+      await spendCollectedUsage({
+        userId: 'user-123',
+        conversationId: 'convo-123',
+        collectedUsage,
+        fallbackModel: 'gpt-4',
+      });
+
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+      expect(mockSpendStructuredTokens).toHaveBeenCalledTimes(1);
+    });
+
    it('should handle real-world parallel agent abort scenario', async () => {
+      // Simulates: Primary agent (gemini) + addedConvo agent (gpt-5) aborted mid-stream
      const collectedUsage = [
        { input_tokens: 31596, output_tokens: 151, model: 'gemini-3-flash-preview' },
        { input_tokens: 28000, output_tokens: 120, model: 'gpt-5.2' },
@ -182,24 +356,27 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gemini-3-flash-preview',
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
-      expect(mockRecordCollectedUsage).toHaveBeenCalledWith(
-        expect.any(Object),
-        expect.objectContaining({
-          user: 'user-123',
-          conversationId: 'convo-123',
-          context: 'abort',
-          model: 'gemini-3-flash-preview',
-        }),
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+
+      // Primary model
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        1,
+        expect.objectContaining({ model: 'gemini-3-flash-preview' }),
+        { promptTokens: 31596, completionTokens: 151 },
+      );
+
+      // Parallel model (addedConvo)
+      expect(mockSpendTokens).toHaveBeenNthCalledWith(
+        2,
+        expect.objectContaining({ model: 'gpt-5.2' }),
+        { promptTokens: 28000, completionTokens: 120 },
      );
    });

-    /**
-     * Race condition prevention: after abort middleware spends tokens,
-     * the collectedUsage array is cleared so AgentClient.recordCollectedUsage()
-     * (which shares the same array reference) sees an empty array and returns early.
-     */
    it('should clear collectedUsage array after spending to prevent double-spending', async () => {
+      // This tests the race condition fix: after abort middleware spends tokens,
+      // the collectedUsage array is cleared so AgentClient.recordCollectedUsage()
+      // (which shares the same array reference) sees an empty array and returns early.
      const collectedUsage = [
        { input_tokens: 100, output_tokens: 50, model: 'gpt-4' },
        { input_tokens: 80, output_tokens: 40, model: 'claude-3' },
@ -214,16 +391,19 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gpt-4',
      });

-      expect(mockRecordCollectedUsage).toHaveBeenCalledTimes(1);
+      expect(mockSpendTokens).toHaveBeenCalledTimes(2);
+
+      // The array should be cleared after spending
      expect(collectedUsage.length).toBe(0);
    });

-    it('should await recordCollectedUsage before clearing array', async () => {
-      let resolved = false;
-      mockRecordCollectedUsage.mockImplementation(async () => {
+    it('should await all token spending operations before clearing array', async () => {
+      // Ensure we don't clear the array before spending completes
+      let spendCallCount = 0;
+      mockSpendTokens.mockImplementation(async () => {
+        spendCallCount++;
+        // Simulate async delay
        await new Promise((resolve) => setTimeout(resolve, 10));
-        resolved = true;
-        return { input_tokens: 100, output_tokens: 50 };
      });

      const collectedUsage = [
@ -238,7 +418,10 @@ describe('abortMiddleware - spendCollectedUsage', () => {
        fallbackModel: 'gpt-4',
      });

-      expect(resolved).toBe(true);
+      // Both spend calls should have completed
+      expect(spendCallCount).toBe(2);
+
+      // Array should be cleared after awaiting
      expect(collectedUsage.length).toBe(0);
    });
  });
--- a/api/server/middleware/accessResources/canAccessAgentFromBody.js
+++ b/api/server/middleware/accessResources/canAccessAgentFromBody.js
@ -1,144 +1,42 @@
 const { logger } = require('@librechat/data-schemas');
 const {
  Constants,
-  Permissions,
  ResourceType,
-  SystemRoles,
-  PermissionTypes,
  isAgentsEndpoint,
  isEphemeralAgentId,
 } = require('librechat-data-provider');
-const { checkPermission } = require('~/server/services/PermissionService');
 const { canAccessResource } = require('./canAccessResource');
-const { getRoleByName } = require('~/models/Role');
 const { getAgent } = require('~/models/Agent');

 /**
- * Resolves custom agent ID (e.g., "agent_abc123") to a MongoDB document.
+ * Agent ID resolver function for agent_id from request body
+ * Resolves custom agent ID (e.g., "agent_abc123") to MongoDB ObjectId
+ * This is used specifically for chat routes where agent_id comes from request body
+ *
 * @param {string} agentCustomId - Custom agent ID from request body
- * @returns {Promise<Object|null>} Agent document with _id field, or null if ephemeral/not found
+ * @returns {Promise<Object|null>} Agent document with _id field, or null if not found
 */
 const resolveAgentIdFromBody = async (agentCustomId) => {
+  // Handle ephemeral agents - they don't need permission checks
+  // Real agent IDs always start with "agent_", so anything else is ephemeral
  if (isEphemeralAgentId(agentCustomId)) {
-    return null;
+    return null; // No permission check needed for ephemeral agents
  }
-  return getAgent({ id: agentCustomId });
+
+  return await getAgent({ id: agentCustomId });
 };

 /**
- * Creates a `canAccessResource` middleware for the given agent ID
- * and chains to the provided continuation on success.
- *
- * @param {string} agentId - The agent's custom string ID (e.g., "agent_abc123")
- * @param {number} requiredPermission - Permission bit(s) required
- * @param {import('express').Request} req
- * @param {import('express').Response} res - Written on deny; continuation called on allow
- * @param {Function} continuation - Called when the permission check passes
- * @returns {Promise<void>}
- */
-const checkAgentResourceAccess = (agentId, requiredPermission, req, res, continuation) => {
-  const middleware = canAccessResource({
-    resourceType: ResourceType.AGENT,
-    requiredPermission,
-    resourceIdParam: 'agent_id',
-    idResolver: () => resolveAgentIdFromBody(agentId),
-  });
-
-  const tempReq = {
-    ...req,
-    params: { ...req.params, agent_id: agentId },
-  };
-
-  return middleware(tempReq, res, continuation);
-};
-
-/**
- * Middleware factory that validates MULTI_CONVO:USE role permission and, when
- * addedConvo.agent_id is a non-ephemeral agent, the same resource-level permission
- * required for the primary agent (`requiredPermission`). Caches the resolved agent
- * document on `req.resolvedAddedAgent` to avoid a duplicate DB fetch in `loadAddedAgent`.
- *
- * @param {number} requiredPermission - Permission bit(s) to check on the added agent resource
- * @returns {(req: import('express').Request, res: import('express').Response, next: Function) => Promise<void>}
- */
-const checkAddedConvoAccess = (requiredPermission) => async (req, res, next) => {
-  const addedConvo = req.body?.addedConvo;
-  if (!addedConvo || typeof addedConvo !== 'object' || Array.isArray(addedConvo)) {
-    return next();
-  }
-
-  try {
-    if (!req.user?.role) {
-      return res.status(403).json({
-        error: 'Forbidden',
-        message: 'Insufficient permissions for multi-conversation',
-      });
-    }
-
-    if (req.user.role !== SystemRoles.ADMIN) {
-      const role = await getRoleByName(req.user.role);
-      const hasMultiConvo = role?.permissions?.[PermissionTypes.MULTI_CONVO]?.[Permissions.USE];
-      if (!hasMultiConvo) {
-        return res.status(403).json({
-          error: 'Forbidden',
-          message: 'Multi-conversation feature is not enabled',
-        });
-      }
-    }
-
-    const addedAgentId = addedConvo.agent_id;
-    if (!addedAgentId || typeof addedAgentId !== 'string' || isEphemeralAgentId(addedAgentId)) {
-      return next();
-    }
-
-    if (req.user.role === SystemRoles.ADMIN) {
-      return next();
-    }
-
-    const agent = await resolveAgentIdFromBody(addedAgentId);
-    if (!agent) {
-      return res.status(404).json({
-        error: 'Not Found',
-        message: `${ResourceType.AGENT} not found`,
-      });
-    }
-
-    const hasPermission = await checkPermission({
-      userId: req.user.id,
-      role: req.user.role,
-      resourceType: ResourceType.AGENT,
-      resourceId: agent._id,
-      requiredPermission,
-    });
-
-    if (!hasPermission) {
-      return res.status(403).json({
-        error: 'Forbidden',
-        message: `Insufficient permissions to access this ${ResourceType.AGENT}`,
-      });
-    }
-
-    req.resolvedAddedAgent = agent;
-    return next();
-  } catch (error) {
-    logger.error('Failed to validate addedConvo access permissions', error);
-    return res.status(500).json({
-      error: 'Internal Server Error',
-      message: 'Failed to validate addedConvo access permissions',
-    });
-  }
-};
-
-/**
- * Middleware factory that checks agent access permissions from request body.
- * Validates both the primary agent_id and, when present, addedConvo.agent_id
- * (which also requires MULTI_CONVO:USE role permission).
+ * Middleware factory that creates middleware to check agent access permissions from request body.
+ * This middleware is specifically designed for chat routes where the agent_id comes from req.body
+ * instead of route parameters.
 *
 * @param {Object} options - Configuration options
 * @param {number} options.requiredPermission - The permission bit required (1=view, 2=edit, 4=delete, 8=share)
 * @returns {Function} Express middleware function
 *
 * @example
+ * // Basic usage for agent chat (requires VIEW permission)
 * router.post('/chat',
 *   canAccessAgentFromBody({ requiredPermission: PermissionBits.VIEW }),
 *   buildEndpointOption,
@ -148,12 +46,11 @@ const checkAddedConvoAccess = (requiredPermission) => async (req, res, next) =>
 const canAccessAgentFromBody = (options) => {
  const { requiredPermission } = options;

+  // Validate required options
  if (!requiredPermission || typeof requiredPermission !== 'number') {
    throw new Error('canAccessAgentFromBody: requiredPermission is required and must be a number');
  }

-  const addedConvoMiddleware = checkAddedConvoAccess(requiredPermission);
-
  return async (req, res, next) => {
    try {
      const { endpoint, agent_id } = req.body;
@ -170,13 +67,28 @@ const canAccessAgentFromBody = (options) => {
        });
      }

-      const afterPrimaryCheck = () => addedConvoMiddleware(req, res, next);
-
+      // Skip permission checks for ephemeral agents
+      // Real agent IDs always start with "agent_", so anything else is ephemeral
      if (isEphemeralAgentId(agentId)) {
-        return afterPrimaryCheck();
+        return next();
      }

-      return checkAgentResourceAccess(agentId, requiredPermission, req, res, afterPrimaryCheck);
+      const agentAccessMiddleware = canAccessResource({
+        resourceType: ResourceType.AGENT,
+        requiredPermission,
+        resourceIdParam: 'agent_id', // This will be ignored since we use custom resolver
+        idResolver: () => resolveAgentIdFromBody(agentId),
+      });
+
+      const tempReq = {
+        ...req,
+        params: {
+          ...req.params,
+          agent_id: agentId,
+        },
+      };
+
+      return agentAccessMiddleware(tempReq, res, next);
    } catch (error) {
      logger.error('Failed to validate agent access permissions', error);
      return res.status(500).json({
--- a/api/server/middleware/accessResources/canAccessAgentFromBody.spec.js
+++ b/api/server/middleware/accessResources/canAccessAgentFromBody.spec.js
@ -1,509 +0,0 @@
-const mongoose = require('mongoose');
-const {
-  ResourceType,
-  SystemRoles,
-  PrincipalType,
-  PrincipalModel,
-} = require('librechat-data-provider');
-const { MongoMemoryServer } = require('mongodb-memory-server');
-const { canAccessAgentFromBody } = require('./canAccessAgentFromBody');
-const { User, Role, AclEntry } = require('~/db/models');
-const { createAgent } = require('~/models/Agent');
-
-describe('canAccessAgentFromBody middleware', () => {
-  let mongoServer;
-  let req, res, next;
-  let testUser, otherUser;
-
-  beforeAll(async () => {
-    mongoServer = await MongoMemoryServer.create();
-    await mongoose.connect(mongoServer.getUri());
-  });
-
-  afterAll(async () => {
-    await mongoose.disconnect();
-    await mongoServer.stop();
-  });
-
-  beforeEach(async () => {
-    await mongoose.connection.dropDatabase();
-
-    await Role.create({
-      name: 'test-role',
-      permissions: {
-        AGENTS: { USE: true, CREATE: true, SHARE: true },
-        MULTI_CONVO: { USE: true },
-      },
-    });
-
-    await Role.create({
-      name: 'no-multi-convo',
-      permissions: {
-        AGENTS: { USE: true, CREATE: true, SHARE: true },
-        MULTI_CONVO: { USE: false },
-      },
-    });
-
-    await Role.create({
-      name: SystemRoles.ADMIN,
-      permissions: {
-        AGENTS: { USE: true, CREATE: true, SHARE: true },
-        MULTI_CONVO: { USE: true },
-      },
-    });
-
-    testUser = await User.create({
-      email: 'test@example.com',
-      name: 'Test User',
-      username: 'testuser',
-      role: 'test-role',
-    });
-
-    otherUser = await User.create({
-      email: 'other@example.com',
-      name: 'Other User',
-      username: 'otheruser',
-      role: 'test-role',
-    });
-
-    req = {
-      user: { id: testUser._id, role: testUser.role },
-      params: {},
-      body: {
-        endpoint: 'agents',
-        agent_id: 'ephemeral_primary',
-      },
-    };
-    res = {
-      status: jest.fn().mockReturnThis(),
-      json: jest.fn(),
-    };
-    next = jest.fn();
-
-    jest.clearAllMocks();
-  });
-
-  describe('middleware factory', () => {
-    test('throws if requiredPermission is missing', () => {
-      expect(() => canAccessAgentFromBody({})).toThrow(
-        'canAccessAgentFromBody: requiredPermission is required and must be a number',
-      );
-    });
-
-    test('throws if requiredPermission is not a number', () => {
-      expect(() => canAccessAgentFromBody({ requiredPermission: '1' })).toThrow(
-        'canAccessAgentFromBody: requiredPermission is required and must be a number',
-      );
-    });
-
-    test('returns a middleware function', () => {
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      expect(typeof middleware).toBe('function');
-      expect(middleware.length).toBe(3);
-    });
-  });
-
-  describe('primary agent checks', () => {
-    test('returns 400 when agent_id is missing on agents endpoint', async () => {
-      req.body.agent_id = undefined;
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(400);
-    });
-
-    test('proceeds for ephemeral primary agent without addedConvo', async () => {
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-    });
-
-    test('proceeds for non-agents endpoint (ephemeral fallback)', async () => {
-      req.body.endpoint = 'openAI';
-      req.body.agent_id = undefined;
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-  });
-
-  describe('addedConvo — absent or invalid shape', () => {
-    test('calls next when addedConvo is absent', async () => {
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-
-    test('calls next when addedConvo is a string', async () => {
-      req.body.addedConvo = 'not-an-object';
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-
-    test('calls next when addedConvo is an array', async () => {
-      req.body.addedConvo = [{ agent_id: 'agent_something' }];
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-  });
-
-  describe('addedConvo — MULTI_CONVO permission gate', () => {
-    test('returns 403 when user lacks MULTI_CONVO:USE', async () => {
-      req.user.role = 'no-multi-convo';
-      req.body.addedConvo = { agent_id: 'agent_x', endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-      expect(res.json).toHaveBeenCalledWith(
-        expect.objectContaining({ message: 'Multi-conversation feature is not enabled' }),
-      );
-    });
-
-    test('returns 403 when user.role is missing', async () => {
-      req.user = { id: testUser._id };
-      req.body.addedConvo = { agent_id: 'agent_x', endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-    });
-
-    test('ADMIN bypasses MULTI_CONVO check', async () => {
-      req.user.role = SystemRoles.ADMIN;
-      req.body.addedConvo = { agent_id: 'ephemeral_x', endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-    });
-  });
-
-  describe('addedConvo — agent_id shape validation', () => {
-    test('calls next when agent_id is ephemeral', async () => {
-      req.body.addedConvo = { agent_id: 'ephemeral_xyz', endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-
-    test('calls next when agent_id is absent', async () => {
-      req.body.addedConvo = { endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-
-    test('calls next when agent_id is not a string (object injection)', async () => {
-      req.body.addedConvo = { agent_id: { $gt: '' }, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-    });
-  });
-
-  describe('addedConvo — agent resource ACL (IDOR prevention)', () => {
-    let addedAgent;
-
-    beforeEach(async () => {
-      addedAgent = await createAgent({
-        id: `agent_added_${Date.now()}`,
-        name: 'Private Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: otherUser._id,
-      });
-
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: otherUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 15,
-        grantedBy: otherUser._id,
-      });
-    });
-
-    test('returns 403 when requester has no ACL for the added agent', async () => {
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-      expect(res.json).toHaveBeenCalledWith(
-        expect.objectContaining({
-          message: 'Insufficient permissions to access this agent',
-        }),
-      );
-    });
-
-    test('returns 404 when added agent does not exist', async () => {
-      req.body.addedConvo = {
-        agent_id: 'agent_nonexistent_999',
-        endpoint: 'agents',
-        model: 'gpt-4',
-      };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(404);
-    });
-
-    test('proceeds when requester has ACL for the added agent', async () => {
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 1,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-    });
-
-    test('denies when ACL permission bits are insufficient', async () => {
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 1,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 2 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-    });
-
-    test('caches resolved agent on req.resolvedAddedAgent', async () => {
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 1,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(req.resolvedAddedAgent).toBeDefined();
-      expect(req.resolvedAddedAgent._id.toString()).toBe(addedAgent._id.toString());
-    });
-
-    test('ADMIN bypasses agent resource ACL for addedConvo', async () => {
-      req.user.role = SystemRoles.ADMIN;
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-      expect(req.resolvedAddedAgent).toBeUndefined();
-    });
-  });
-
-  describe('end-to-end: primary real agent + addedConvo real agent', () => {
-    let primaryAgent, addedAgent;
-
-    beforeEach(async () => {
-      primaryAgent = await createAgent({
-        id: `agent_primary_${Date.now()}`,
-        name: 'Primary Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: testUser._id,
-      });
-
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: primaryAgent._id,
-        permBits: 15,
-        grantedBy: testUser._id,
-      });
-
-      addedAgent = await createAgent({
-        id: `agent_added_${Date.now()}`,
-        name: 'Added Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: otherUser._id,
-      });
-
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: otherUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 15,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.agent_id = primaryAgent.id;
-    });
-
-    test('both checks pass when user has ACL for both agents', async () => {
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 1,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-      expect(req.resolvedAddedAgent).toBeDefined();
-    });
-
-    test('primary passes but addedConvo denied → 403', async () => {
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-    });
-
-    test('primary denied → 403 without reaching addedConvo check', async () => {
-      const foreignAgent = await createAgent({
-        id: `agent_foreign_${Date.now()}`,
-        name: 'Foreign Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: otherUser._id,
-      });
-
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: otherUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: foreignAgent._id,
-        permBits: 15,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.agent_id = foreignAgent.id;
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-    });
-  });
-
-  describe('ephemeral primary + real addedConvo agent', () => {
-    let addedAgent;
-
-    beforeEach(async () => {
-      addedAgent = await createAgent({
-        id: `agent_added_${Date.now()}`,
-        name: 'Added Agent',
-        provider: 'openai',
-        model: 'gpt-4',
-        author: otherUser._id,
-      });
-
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: otherUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 15,
-        grantedBy: otherUser._id,
-      });
-    });
-
-    test('runs full addedConvo ACL check even when primary is ephemeral', async () => {
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).not.toHaveBeenCalled();
-      expect(res.status).toHaveBeenCalledWith(403);
-    });
-
-    test('proceeds when user has ACL for added agent (ephemeral primary)', async () => {
-      await AclEntry.create({
-        principalType: PrincipalType.USER,
-        principalId: testUser._id,
-        principalModel: PrincipalModel.USER,
-        resourceType: ResourceType.AGENT,
-        resourceId: addedAgent._id,
-        permBits: 1,
-        grantedBy: otherUser._id,
-      });
-
-      req.body.addedConvo = { agent_id: addedAgent.id, endpoint: 'agents', model: 'gpt-4' };
-
-      const middleware = canAccessAgentFromBody({ requiredPermission: 1 });
-      await middleware(req, res, next);
-
-      expect(next).toHaveBeenCalled();
-      expect(res.status).not.toHaveBeenCalled();
-    });
-  });
-});
--- a/api/server/middleware/buildEndpointOption.js
+++ b/api/server/middleware/buildEndpointOption.js
@ -5,11 +5,9 @@ const {
  EModelEndpoint,
  isAgentsEndpoint,
  parseCompactConvo,
-  getDefaultParamsEndpoint,
 } = require('librechat-data-provider');
 const azureAssistants = require('~/server/services/Endpoints/azureAssistants');
 const assistants = require('~/server/services/Endpoints/assistants');
-const { getEndpointsConfig } = require('~/server/services/Config');
 const agents = require('~/server/services/Endpoints/agents');
 const { updateFilesUsage } = require('~/models');

@ -21,24 +19,9 @@ const buildFunction = {

 async function buildEndpointOption(req, res, next) {
  const { endpoint, endpointType } = req.body;
-
-  let endpointsConfig;
-  try {
-    endpointsConfig = await getEndpointsConfig(req);
-  } catch (error) {
-    logger.error('Error fetching endpoints config in buildEndpointOption', error);
-  }
-
-  const defaultParamsEndpoint = getDefaultParamsEndpoint(endpointsConfig, endpoint);
-
  let parsedBody;
  try {
-    parsedBody = parseCompactConvo({
-      endpoint,
-      endpointType,
-      conversation: req.body,
-      defaultParamsEndpoint,
-    });
+    parsedBody = parseCompactConvo({ endpoint, endpointType, conversation: req.body });
  } catch (error) {
    logger.error(`Error parsing compact conversation for endpoint ${endpoint}`, error);
    logger.debug({
@ -72,7 +55,6 @@ async function buildEndpointOption(req, res, next) {
        endpoint,
        endpointType,
        conversation: currentModelSpec.preset,
-        defaultParamsEndpoint,
      });
      if (currentModelSpec.iconURL != null && currentModelSpec.iconURL !== '') {
        parsedBody.iconURL = currentModelSpec.iconURL;
--- a/api/server/middleware/buildEndpointOption.spec.js
+++ b/api/server/middleware/buildEndpointOption.spec.js
@ -1,237 +0,0 @@
-/**
- * Wrap parseCompactConvo: the REAL function runs, but jest can observe
- * calls and return values. Must be declared before require('./buildEndpointOption')
- * so the destructured reference in the middleware captures the wrapper.
- */
-jest.mock('librechat-data-provider', () => {
-  const actual = jest.requireActual('librechat-data-provider');
-  return {
-    ...actual,
-    parseCompactConvo: jest.fn((...args) => actual.parseCompactConvo(...args)),
-  };
-});
-
-const { EModelEndpoint, parseCompactConvo } = require('librechat-data-provider');
-
-const mockBuildOptions = jest.fn((_endpoint, parsedBody) => ({
-  ...parsedBody,
-  endpoint: _endpoint,
-}));
-
-jest.mock('~/server/services/Endpoints/azureAssistants', () => ({
-  buildOptions: mockBuildOptions,
-}));
-jest.mock('~/server/services/Endpoints/assistants', () => ({
-  buildOptions: mockBuildOptions,
-}));
-jest.mock('~/server/services/Endpoints/agents', () => ({
-  buildOptions: mockBuildOptions,
-}));
-
-jest.mock('~/models', () => ({
-  updateFilesUsage: jest.fn(),
-}));
-
-const mockGetEndpointsConfig = jest.fn();
-jest.mock('~/server/services/Config', () => ({
-  getEndpointsConfig: (...args) => mockGetEndpointsConfig(...args),
-}));
-
-jest.mock('@librechat/api', () => ({
-  handleError: jest.fn(),
-}));
-
-const buildEndpointOption = require('./buildEndpointOption');
-
-const createReq = (body, config = {}) => ({
-  body,
-  config,
-  baseUrl: '/api/chat',
-});
-
-const createRes = () => ({
-  status: jest.fn().mockReturnThis(),
-  json: jest.fn().mockReturnThis(),
-});
-
-describe('buildEndpointOption - defaultParamsEndpoint parsing', () => {
-  beforeEach(() => {
-    jest.clearAllMocks();
-  });
-
-  it('should pass defaultParamsEndpoint to parseCompactConvo and preserve maxOutputTokens', async () => {
-    mockGetEndpointsConfig.mockResolvedValue({
-      AnthropicClaude: {
-        type: EModelEndpoint.custom,
-        customParams: {
-          defaultParamsEndpoint: EModelEndpoint.anthropic,
-        },
-      },
-    });
-
-    const req = createReq(
-      {
-        endpoint: 'AnthropicClaude',
-        endpointType: EModelEndpoint.custom,
-        model: 'anthropic/claude-opus-4.5',
-        temperature: 0.7,
-        maxOutputTokens: 8192,
-        topP: 0.9,
-        maxContextTokens: 50000,
-      },
-      { modelSpecs: null },
-    );
-
-    await buildEndpointOption(req, createRes(), jest.fn());
-
-    expect(parseCompactConvo).toHaveBeenCalledWith(
-      expect.objectContaining({
-        defaultParamsEndpoint: EModelEndpoint.anthropic,
-      }),
-    );
-
-    const parsedResult = parseCompactConvo.mock.results[0].value;
-    expect(parsedResult.maxOutputTokens).toBe(8192);
-    expect(parsedResult.topP).toBe(0.9);
-    expect(parsedResult.temperature).toBe(0.7);
-    expect(parsedResult.maxContextTokens).toBe(50000);
-  });
-
-  it('should strip maxOutputTokens when no defaultParamsEndpoint is configured', async () => {
-    mockGetEndpointsConfig.mockResolvedValue({
-      MyOpenRouter: {
-        type: EModelEndpoint.custom,
-      },
-    });
-
-    const req = createReq(
-      {
-        endpoint: 'MyOpenRouter',
-        endpointType: EModelEndpoint.custom,
-        model: 'gpt-4o',
-        temperature: 0.7,
-        maxOutputTokens: 8192,
-        max_tokens: 4096,
-      },
-      { modelSpecs: null },
-    );
-
-    await buildEndpointOption(req, createRes(), jest.fn());
-
-    expect(parseCompactConvo).toHaveBeenCalledWith(
-      expect.objectContaining({
-        defaultParamsEndpoint: undefined,
-      }),
-    );
-
-    const parsedResult = parseCompactConvo.mock.results[0].value;
-    expect(parsedResult.maxOutputTokens).toBeUndefined();
-    expect(parsedResult.max_tokens).toBe(4096);
-    expect(parsedResult.temperature).toBe(0.7);
-  });
-
-  it('should strip bedrock region from custom endpoint without defaultParamsEndpoint', async () => {
-    mockGetEndpointsConfig.mockResolvedValue({
-      MyEndpoint: {
-        type: EModelEndpoint.custom,
-      },
-    });
-
-    const req = createReq(
-      {
-        endpoint: 'MyEndpoint',
-        endpointType: EModelEndpoint.custom,
-        model: 'gpt-4o',
-        temperature: 0.7,
-        region: 'us-east-1',
-      },
-      { modelSpecs: null },
-    );
-
-    await buildEndpointOption(req, createRes(), jest.fn());
-
-    const parsedResult = parseCompactConvo.mock.results[0].value;
-    expect(parsedResult.region).toBeUndefined();
-    expect(parsedResult.temperature).toBe(0.7);
-  });
-
-  it('should pass defaultParamsEndpoint when re-parsing enforced model spec', async () => {
-    mockGetEndpointsConfig.mockResolvedValue({
-      AnthropicClaude: {
-        type: EModelEndpoint.custom,
-        customParams: {
-          defaultParamsEndpoint: EModelEndpoint.anthropic,
-        },
-      },
-    });
-
-    const modelSpec = {
-      name: 'claude-opus-4.5',
-      preset: {
-        endpoint: 'AnthropicClaude',
-        endpointType: EModelEndpoint.custom,
-        model: 'anthropic/claude-opus-4.5',
-        temperature: 0.7,
-        maxOutputTokens: 8192,
-        maxContextTokens: 50000,
-      },
-    };
-
-    const req = createReq(
-      {
-        endpoint: 'AnthropicClaude',
-        endpointType: EModelEndpoint.custom,
-        spec: 'claude-opus-4.5',
-        model: 'anthropic/claude-opus-4.5',
-      },
-      {
-        modelSpecs: {
-          enforce: true,
-          list: [modelSpec],
-        },
-      },
-    );
-
-    await buildEndpointOption(req, createRes(), jest.fn());
-
-    const enforcedCall = parseCompactConvo.mock.calls[1];
-    expect(enforcedCall[0]).toEqual(
-      expect.objectContaining({
-        defaultParamsEndpoint: EModelEndpoint.anthropic,
-      }),
-    );
-
-    const enforcedResult = parseCompactConvo.mock.results[1].value;
-    expect(enforcedResult.maxOutputTokens).toBe(8192);
-    expect(enforcedResult.temperature).toBe(0.7);
-    expect(enforcedResult.maxContextTokens).toBe(50000);
-  });
-
-  it('should fall back to OpenAI schema when getEndpointsConfig fails', async () => {
-    mockGetEndpointsConfig.mockRejectedValue(new Error('Config unavailable'));
-
-    const req = createReq(
-      {
-        endpoint: 'AnthropicClaude',
-        endpointType: EModelEndpoint.custom,
-        model: 'anthropic/claude-opus-4.5',
-        temperature: 0.7,
-        maxOutputTokens: 8192,
-        max_tokens: 4096,
-      },
-      { modelSpecs: null },
-    );
-
-    await buildEndpointOption(req, createRes(), jest.fn());
-
-    expect(parseCompactConvo).toHaveBeenCalledWith(
-      expect.objectContaining({
-        defaultParamsEndpoint: undefined,
-      }),
-    );
-
-    const parsedResult = parseCompactConvo.mock.results[0].value;
-    expect(parsedResult.maxOutputTokens).toBeUndefined();
-    expect(parsedResult.max_tokens).toBe(4096);
-  });
-});
--- a/api/server/middleware/checkSharePublicAccess.js
+++ b/api/server/middleware/checkSharePublicAccess.js
@ -9,7 +9,6 @@ const resourceToPermissionType = {
  [ResourceType.AGENT]: PermissionTypes.AGENTS,
  [ResourceType.PROMPTGROUP]: PermissionTypes.PROMPTS,
  [ResourceType.MCPSERVER]: PermissionTypes.MCP_SERVERS,
-  [ResourceType.REMOTE_AGENT]: PermissionTypes.REMOTE_AGENTS,
 };

 /**
--- a/api/server/middleware/limiters/forkLimiters.js
+++ b/api/server/middleware/limiters/forkLimiters.js
@ -48,7 +48,7 @@ const createForkHandler = (ip = true) => {
    };

    await logViolation(req, res, type, errorMessage, forkViolationScore);
-    res.status(429).json({ message: 'Too many requests. Try again later' });
+    res.status(429).json({ message: 'Too many conversation fork requests. Try again later' });
  };
 };

--- a/api/server/middleware/requireJwtAuth.js
+++ b/api/server/middleware/requireJwtAuth.js
@ -7,13 +7,16 @@ const { isEnabled } = require('@librechat/api');
 * Switches between JWT and OpenID authentication based on cookies and environment settings
 */
 const requireJwtAuth = (req, res, next) => {
+  // Check if token provider is specified in cookies
  const cookieHeader = req.headers.cookie;
  const tokenProvider = cookieHeader ? cookies.parse(cookieHeader).token_provider : null;

+  // Use OpenID authentication if token provider is OpenID and OPENID_REUSE_TOKENS is enabled
  if (tokenProvider === 'openid' && isEnabled(process.env.OPENID_REUSE_TOKENS)) {
    return passport.authenticate('openidJwt', { session: false })(req, res, next);
  }

+  // Default to standard JWT authentication
  return passport.authenticate('jwt', { session: false })(req, res, next);
 };

--- a/api/server/routes/test-utils/convos-route-mocks.js
+++ b/api/server/routes/test-utils/convos-route-mocks.js
@ -1,93 +0,0 @@
-module.exports = {
-  agents: () => ({ sleep: jest.fn() }),
-
-  api: (overrides = {}) => ({
-    isEnabled: jest.fn(),
-    resolveImportMaxFileSize: jest.fn(() => 262144000),
-    createAxiosInstance: jest.fn(() => ({
-      get: jest.fn(),
-      post: jest.fn(),
-      put: jest.fn(),
-      delete: jest.fn(),
-    })),
-    logAxiosError: jest.fn(),
-    ...overrides,
-  }),
-
-  dataSchemas: () => ({
-    logger: {
-      debug: jest.fn(),
-      info: jest.fn(),
-      warn: jest.fn(),
-      error: jest.fn(),
-    },
-    createModels: jest.fn(() => ({
-      User: {},
-      Conversation: {},
-      Message: {},
-      SharedLink: {},
-    })),
-  }),
-
-  dataProvider: (overrides = {}) => ({
-    CacheKeys: { GEN_TITLE: 'GEN_TITLE' },
-    EModelEndpoint: {
-      azureAssistants: 'azureAssistants',
-      assistants: 'assistants',
-    },
-    ...overrides,
-  }),
-
-  conversationModel: () => ({
-    getConvosByCursor: jest.fn(),
-    getConvo: jest.fn(),
-    deleteConvos: jest.fn(),
-    saveConvo: jest.fn(),
-  }),
-
-  toolCallModel: () => ({ deleteToolCalls: jest.fn() }),
-
-  sharedModels: () => ({
-    deleteAllSharedLinks: jest.fn(),
-    deleteConvoSharedLink: jest.fn(),
-  }),
-
-  requireJwtAuth: () => (req, res, next) => next(),
-
-  middlewarePassthrough: () => ({
-    createImportLimiters: jest.fn(() => ({
-      importIpLimiter: (req, res, next) => next(),
-      importUserLimiter: (req, res, next) => next(),
-    })),
-    createForkLimiters: jest.fn(() => ({
-      forkIpLimiter: (req, res, next) => next(),
-      forkUserLimiter: (req, res, next) => next(),
-    })),
-    configMiddleware: (req, res, next) => next(),
-    validateConvoAccess: (req, res, next) => next(),
-  }),
-
-  forkUtils: () => ({
-    forkConversation: jest.fn(),
-    duplicateConversation: jest.fn(),
-  }),
-
-  importUtils: () => ({ importConversations: jest.fn() }),
-
-  logStores: () => jest.fn(),
-
-  multerSetup: () => ({
-    storage: {},
-    importFileFilter: jest.fn(),
-  }),
-
-  multerLib: () =>
-    jest.fn(() => ({
-      single: jest.fn(() => (req, res, next) => {
-        req.file = { path: '/tmp/test-file.json' };
-        next();
-      }),
-    })),
-
-  assistantEndpoint: () => ({ initializeClient: jest.fn() }),
-};
--- a/api/server/routes/tests/convos-duplicate-ratelimit.spec.js
+++ b/api/server/routes/tests/convos-duplicate-ratelimit.spec.js
@ -1,135 +0,0 @@
-const express = require('express');
-const request = require('supertest');
-
-const MOCKS = '../__test-utils__/convos-route-mocks';
-
-jest.mock('@librechat/agents', () => require(MOCKS).agents());
-jest.mock('@librechat/api', () => require(MOCKS).api({ limiterCache: jest.fn(() => undefined) }));
-jest.mock('@librechat/data-schemas', () => require(MOCKS).dataSchemas());
-jest.mock('librechat-data-provider', () =>
-  require(MOCKS).dataProvider({ ViolationTypes: { FILE_UPLOAD_LIMIT: 'file_upload_limit' } }),
-);
-
-jest.mock('~/cache/logViolation', () => jest.fn().mockResolvedValue(undefined));
-jest.mock('~/cache/getLogStores', () => require(MOCKS).logStores());
-jest.mock('~/models/Conversation', () => require(MOCKS).conversationModel());
-jest.mock('~/models/ToolCall', () => require(MOCKS).toolCallModel());
-jest.mock('~/models', () => require(MOCKS).sharedModels());
-jest.mock('~/server/middleware/requireJwtAuth', () => require(MOCKS).requireJwtAuth());
-
-jest.mock('~/server/middleware', () => {
-  const { createForkLimiters } = jest.requireActual('~/server/middleware/limiters/forkLimiters');
-  return {
-    createImportLimiters: jest.fn(() => ({
-      importIpLimiter: (req, res, next) => next(),
-      importUserLimiter: (req, res, next) => next(),
-    })),
-    createForkLimiters,
-    configMiddleware: (req, res, next) => next(),
-    validateConvoAccess: (req, res, next) => next(),
-  };
-});
-
-jest.mock('~/server/utils/import/fork', () => require(MOCKS).forkUtils());
-jest.mock('~/server/utils/import', () => require(MOCKS).importUtils());
-jest.mock('~/server/routes/files/multer', () => require(MOCKS).multerSetup());
-jest.mock('multer', () => require(MOCKS).multerLib());
-jest.mock('~/server/services/Endpoints/azureAssistants', () => require(MOCKS).assistantEndpoint());
-jest.mock('~/server/services/Endpoints/assistants', () => require(MOCKS).assistantEndpoint());
-
-describe('POST /api/convos/duplicate - Rate Limiting', () => {
-  let app;
-  let duplicateConversation;
-  const savedEnv = {};
-
-  beforeAll(() => {
-    savedEnv.FORK_USER_MAX = process.env.FORK_USER_MAX;
-    savedEnv.FORK_USER_WINDOW = process.env.FORK_USER_WINDOW;
-    savedEnv.FORK_IP_MAX = process.env.FORK_IP_MAX;
-    savedEnv.FORK_IP_WINDOW = process.env.FORK_IP_WINDOW;
-  });
-
-  afterAll(() => {
-    for (const key of Object.keys(savedEnv)) {
-      if (savedEnv[key] === undefined) {
-        delete process.env[key];
-      } else {
-        process.env[key] = savedEnv[key];
-      }
-    }
-  });
-
-  const setupApp = () => {
-    jest.clearAllMocks();
-    jest.isolateModules(() => {
-      const convosRouter = require('../convos');
-      ({ duplicateConversation } = require('~/server/utils/import/fork'));
-
-      app = express();
-      app.use(express.json());
-      app.use((req, res, next) => {
-        req.user = { id: 'rate-limit-test-user' };
-        next();
-      });
-      app.use('/api/convos', convosRouter);
-    });
-
-    duplicateConversation.mockResolvedValue({
-      conversation: { conversationId: 'duplicated-conv' },
-    });
-  };
-
-  describe('user limit', () => {
-    beforeEach(() => {
-      process.env.FORK_USER_MAX = '2';
-      process.env.FORK_USER_WINDOW = '1';
-      process.env.FORK_IP_MAX = '100';
-      process.env.FORK_IP_WINDOW = '1';
-      setupApp();
-    });
-
-    it('should return 429 after exceeding the user rate limit', async () => {
-      const userMax = parseInt(process.env.FORK_USER_MAX, 10);
-
-      for (let i = 0; i < userMax; i++) {
-        const res = await request(app)
-          .post('/api/convos/duplicate')
-          .send({ conversationId: 'conv-123' });
-        expect(res.status).toBe(201);
-      }
-
-      const res = await request(app)
-        .post('/api/convos/duplicate')
-        .send({ conversationId: 'conv-123' });
-      expect(res.status).toBe(429);
-      expect(res.body.message).toMatch(/too many/i);
-    });
-  });
-
-  describe('IP limit', () => {
-    beforeEach(() => {
-      process.env.FORK_USER_MAX = '100';
-      process.env.FORK_USER_WINDOW = '1';
-      process.env.FORK_IP_MAX = '2';
-      process.env.FORK_IP_WINDOW = '1';
-      setupApp();
-    });
-
-    it('should return 429 after exceeding the IP rate limit', async () => {
-      const ipMax = parseInt(process.env.FORK_IP_MAX, 10);
-
-      for (let i = 0; i < ipMax; i++) {
-        const res = await request(app)
-          .post('/api/convos/duplicate')
-          .send({ conversationId: 'conv-123' });
-        expect(res.status).toBe(201);
-      }
-
-      const res = await request(app)
-        .post('/api/convos/duplicate')
-        .send({ conversationId: 'conv-123' });
-      expect(res.status).toBe(429);
-      expect(res.body.message).toMatch(/too many/i);
-    });
-  });
-});
--- a/api/server/routes/tests/convos-import.spec.js
+++ b/api/server/routes/tests/convos-import.spec.js
@ -1,98 +0,0 @@
-const express = require('express');
-const request = require('supertest');
-const multer = require('multer');
-
-const importFileFilter = (req, file, cb) => {
-  if (file.mimetype === 'application/json') {
-    cb(null, true);
-  } else {
-    cb(new Error('Only JSON files are allowed'), false);
-  }
-};
-
-/** Proxy app that mirrors the production multer + error-handling pattern */
-function createImportApp(fileSize) {
-  const app = express();
-  const upload = multer({
-    storage: multer.memoryStorage(),
-    fileFilter: importFileFilter,
-    limits: { fileSize },
-  });
-  const uploadSingle = upload.single('file');
-
-  function handleUpload(req, res, next) {
-    uploadSingle(req, res, (err) => {
-      if (err && err.code === 'LIMIT_FILE_SIZE') {
-        return res.status(413).json({ message: 'File exceeds the maximum allowed size' });
-      }
-      if (err) {
-        return next(err);
-      }
-      next();
-    });
-  }
-
-  app.post('/import', handleUpload, (req, res) => {
-    res.status(201).json({ message: 'success', size: req.file.size });
-  });
-
-  app.use((err, _req, res, _next) => {
-    res.status(400).json({ error: err.message });
-  });
-
-  return app;
-}
-
-describe('Conversation Import - Multer File Size Limits', () => {
-  describe('multer rejects files exceeding the configured limit', () => {
-    it('returns 413 for files larger than the limit', async () => {
-      const limit = 1024;
-      const app = createImportApp(limit);
-      const oversized = Buffer.alloc(limit + 512, 'x');
-
-      const res = await request(app)
-        .post('/import')
-        .attach('file', oversized, { filename: 'import.json', contentType: 'application/json' });
-
-      expect(res.status).toBe(413);
-      expect(res.body.message).toBe('File exceeds the maximum allowed size');
-    });
-
-    it('accepts files within the limit', async () => {
-      const limit = 4096;
-      const app = createImportApp(limit);
-      const valid = Buffer.from(JSON.stringify({ title: 'test' }));
-
-      const res = await request(app)
-        .post('/import')
-        .attach('file', valid, { filename: 'import.json', contentType: 'application/json' });
-
-      expect(res.status).toBe(201);
-      expect(res.body.message).toBe('success');
-    });
-
-    it('rejects at the exact boundary (limit + 1 byte)', async () => {
-      const limit = 512;
-      const app = createImportApp(limit);
-      const boundary = Buffer.alloc(limit + 1, 'a');
-
-      const res = await request(app)
-        .post('/import')
-        .attach('file', boundary, { filename: 'import.json', contentType: 'application/json' });
-
-      expect(res.status).toBe(413);
-    });
-
-    it('accepts a file just under the limit', async () => {
-      const limit = 512;
-      const app = createImportApp(limit);
-      const underLimit = Buffer.alloc(limit - 1, 'b');
-
-      const res = await request(app)
-        .post('/import')
-        .attach('file', underLimit, { filename: 'import.json', contentType: 'application/json' });
-
-      expect(res.status).toBe(201);
-    });
-  });
-});
--- a/api/server/routes/tests/convos.spec.js
+++ b/api/server/routes/tests/convos.spec.js
@ -1,24 +1,109 @@
 const express = require('express');
 const request = require('supertest');

-const MOCKS = '../__test-utils__/convos-route-mocks';
+jest.mock('@librechat/agents', () => ({
+  sleep: jest.fn(),
+}));

-jest.mock('@librechat/agents', () => require(MOCKS).agents());
-jest.mock('@librechat/api', () => require(MOCKS).api());
-jest.mock('@librechat/data-schemas', () => require(MOCKS).dataSchemas());
-jest.mock('librechat-data-provider', () => require(MOCKS).dataProvider());
-jest.mock('~/models/Conversation', () => require(MOCKS).conversationModel());
-jest.mock('~/models/ToolCall', () => require(MOCKS).toolCallModel());
-jest.mock('~/models', () => require(MOCKS).sharedModels());
-jest.mock('~/server/middleware/requireJwtAuth', () => require(MOCKS).requireJwtAuth());
-jest.mock('~/server/middleware', () => require(MOCKS).middlewarePassthrough());
-jest.mock('~/server/utils/import/fork', () => require(MOCKS).forkUtils());
-jest.mock('~/server/utils/import', () => require(MOCKS).importUtils());
-jest.mock('~/cache/getLogStores', () => require(MOCKS).logStores());
-jest.mock('~/server/routes/files/multer', () => require(MOCKS).multerSetup());
-jest.mock('multer', () => require(MOCKS).multerLib());
-jest.mock('~/server/services/Endpoints/azureAssistants', () => require(MOCKS).assistantEndpoint());
-jest.mock('~/server/services/Endpoints/assistants', () => require(MOCKS).assistantEndpoint());
+jest.mock('@librechat/api', () => ({
+  isEnabled: jest.fn(),
+  createAxiosInstance: jest.fn(() => ({
+    get: jest.fn(),
+    post: jest.fn(),
+    put: jest.fn(),
+    delete: jest.fn(),
+  })),
+  logAxiosError: jest.fn(),
+}));
+
+jest.mock('@librechat/data-schemas', () => ({
+  logger: {
+    debug: jest.fn(),
+    info: jest.fn(),
+    warn: jest.fn(),
+    error: jest.fn(),
+  },
+  createModels: jest.fn(() => ({
+    User: {},
+    Conversation: {},
+    Message: {},
+    SharedLink: {},
+  })),
+}));
+
+jest.mock('~/models/Conversation', () => ({
+  getConvosByCursor: jest.fn(),
+  getConvo: jest.fn(),
+  deleteConvos: jest.fn(),
+  saveConvo: jest.fn(),
+}));
+
+jest.mock('~/models/ToolCall', () => ({
+  deleteToolCalls: jest.fn(),
+}));
+
+jest.mock('~/models', () => ({
+  deleteAllSharedLinks: jest.fn(),
+  deleteConvoSharedLink: jest.fn(),
+}));
+
+jest.mock('~/server/middleware/requireJwtAuth', () => (req, res, next) => next());
+
+jest.mock('~/server/middleware', () => ({
+  createImportLimiters: jest.fn(() => ({
+    importIpLimiter: (req, res, next) => next(),
+    importUserLimiter: (req, res, next) => next(),
+  })),
+  createForkLimiters: jest.fn(() => ({
+    forkIpLimiter: (req, res, next) => next(),
+    forkUserLimiter: (req, res, next) => next(),
+  })),
+  configMiddleware: (req, res, next) => next(),
+  validateConvoAccess: (req, res, next) => next(),
+}));
+
+jest.mock('~/server/utils/import/fork', () => ({
+  forkConversation: jest.fn(),
+  duplicateConversation: jest.fn(),
+}));
+
+jest.mock('~/server/utils/import', () => ({
+  importConversations: jest.fn(),
+}));
+
+jest.mock('~/cache/getLogStores', () => jest.fn());
+
+jest.mock('~/server/routes/files/multer', () => ({
+  storage: {},
+  importFileFilter: jest.fn(),
+}));
+
+jest.mock('multer', () => {
+  return jest.fn(() => ({
+    single: jest.fn(() => (req, res, next) => {
+      req.file = { path: '/tmp/test-file.json' };
+      next();
+    }),
+  }));
+});
+
+jest.mock('librechat-data-provider', () => ({
+  CacheKeys: {
+    GEN_TITLE: 'GEN_TITLE',
+  },
+  EModelEndpoint: {
+    azureAssistants: 'azureAssistants',
+    assistants: 'assistants',
+  },
+}));
+
+jest.mock('~/server/services/Endpoints/azureAssistants', () => ({
+  initializeClient: jest.fn(),
+}));
+
+jest.mock('~/server/services/Endpoints/assistants', () => ({
+  initializeClient: jest.fn(),
+}));

 describe('Convos Routes', () => {
  let app;
@ -300,40 +385,6 @@ describe('Convos Routes', () => {
      expect(deleteConvoSharedLink).not.toHaveBeenCalled();
    });

-    it('should return 400 when request body is empty (DoS prevention)', async () => {
-      const response = await request(app).delete('/api/convos').send({});
-
-      expect(response.status).toBe(400);
-      expect(response.body).toEqual({ error: 'no parameters provided' });
-      expect(deleteConvos).not.toHaveBeenCalled();
-    });
-
-    it('should return 400 when arg is null (DoS prevention)', async () => {
-      const response = await request(app).delete('/api/convos').send({ arg: null });
-
-      expect(response.status).toBe(400);
-      expect(response.body).toEqual({ error: 'no parameters provided' });
-      expect(deleteConvos).not.toHaveBeenCalled();
-    });
-
-    it('should return 400 when arg is undefined (DoS prevention)', async () => {
-      const response = await request(app).delete('/api/convos').send({ arg: undefined });
-
-      expect(response.status).toBe(400);
-      expect(response.body).toEqual({ error: 'no parameters provided' });
-      expect(deleteConvos).not.toHaveBeenCalled();
-    });
-
-    it('should return 400 when request body is null (DoS prevention)', async () => {
-      const response = await request(app)
-        .delete('/api/convos')
-        .set('Content-Type', 'application/json')
-        .send('null');
-
-      expect(response.status).toBe(400);
-      expect(deleteConvos).not.toHaveBeenCalled();
-    });
-
    it('should return 500 if deleteConvoSharedLink fails', async () => {
      const mockConversationId = 'conv-error';

--- a/api/server/routes/tests/keys.spec.js
+++ b/api/server/routes/tests/keys.spec.js
@ -1,174 +0,0 @@
-const express = require('express');
-const request = require('supertest');
-
-jest.mock('~/models', () => ({
-  updateUserKey: jest.fn(),
-  deleteUserKey: jest.fn(),
-  getUserKeyExpiry: jest.fn(),
-}));
-
-jest.mock('~/server/middleware/requireJwtAuth', () => (req, res, next) => next());
-
-jest.mock('~/server/middleware', () => ({
-  requireJwtAuth: (req, res, next) => next(),
-}));
-
-describe('Keys Routes', () => {
-  let app;
-  const { updateUserKey, deleteUserKey, getUserKeyExpiry } = require('~/models');
-
-  beforeAll(() => {
-    const keysRouter = require('../keys');
-
-    app = express();
-    app.use(express.json());
-
-    app.use((req, res, next) => {
-      req.user = { id: 'test-user-123' };
-      next();
-    });
-
-    app.use('/api/keys', keysRouter);
-  });
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-  });
-
-  describe('PUT /', () => {
-    it('should update a user key with the authenticated user ID', async () => {
-      updateUserKey.mockResolvedValue({});
-
-      const response = await request(app)
-        .put('/api/keys')
-        .send({ name: 'openAI', value: 'sk-test-key-123', expiresAt: '2026-12-31' });
-
-      expect(response.status).toBe(201);
-      expect(updateUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'openAI',
-        value: 'sk-test-key-123',
-        expiresAt: '2026-12-31',
-      });
-      expect(updateUserKey).toHaveBeenCalledTimes(1);
-    });
-
-    it('should not allow userId override via request body (IDOR prevention)', async () => {
-      updateUserKey.mockResolvedValue({});
-
-      const response = await request(app).put('/api/keys').send({
-        userId: 'attacker-injected-id',
-        name: 'openAI',
-        value: 'sk-attacker-key',
-      });
-
-      expect(response.status).toBe(201);
-      expect(updateUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'openAI',
-        value: 'sk-attacker-key',
-        expiresAt: undefined,
-      });
-    });
-
-    it('should ignore extraneous fields from request body', async () => {
-      updateUserKey.mockResolvedValue({});
-
-      const response = await request(app).put('/api/keys').send({
-        name: 'openAI',
-        value: 'sk-test-key',
-        expiresAt: '2026-12-31',
-        _id: 'injected-mongo-id',
-        __v: 99,
-        extra: 'should-be-ignored',
-      });
-
-      expect(response.status).toBe(201);
-      expect(updateUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'openAI',
-        value: 'sk-test-key',
-        expiresAt: '2026-12-31',
-      });
-    });
-
-    it('should handle missing optional fields', async () => {
-      updateUserKey.mockResolvedValue({});
-
-      const response = await request(app)
-        .put('/api/keys')
-        .send({ name: 'anthropic', value: 'sk-ant-key' });
-
-      expect(response.status).toBe(201);
-      expect(updateUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'anthropic',
-        value: 'sk-ant-key',
-        expiresAt: undefined,
-      });
-    });
-
-    it('should return 400 when request body is null', async () => {
-      const response = await request(app)
-        .put('/api/keys')
-        .set('Content-Type', 'application/json')
-        .send('null');
-
-      expect(response.status).toBe(400);
-      expect(updateUserKey).not.toHaveBeenCalled();
-    });
-  });
-
-  describe('DELETE /:name', () => {
-    it('should delete a user key by name', async () => {
-      deleteUserKey.mockResolvedValue({});
-
-      const response = await request(app).delete('/api/keys/openAI');
-
-      expect(response.status).toBe(204);
-      expect(deleteUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'openAI',
-      });
-      expect(deleteUserKey).toHaveBeenCalledTimes(1);
-    });
-  });
-
-  describe('DELETE /', () => {
-    it('should delete all keys when all=true', async () => {
-      deleteUserKey.mockResolvedValue({});
-
-      const response = await request(app).delete('/api/keys?all=true');
-
-      expect(response.status).toBe(204);
-      expect(deleteUserKey).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        all: true,
-      });
-    });
-
-    it('should return 400 when all query param is not true', async () => {
-      const response = await request(app).delete('/api/keys');
-
-      expect(response.status).toBe(400);
-      expect(response.body).toEqual({ error: 'Specify either all=true to delete.' });
-      expect(deleteUserKey).not.toHaveBeenCalled();
-    });
-  });
-
-  describe('GET /', () => {
-    it('should return key expiry for a given key name', async () => {
-      const mockExpiry = { expiresAt: '2026-12-31' };
-      getUserKeyExpiry.mockResolvedValue(mockExpiry);
-
-      const response = await request(app).get('/api/keys?name=openAI');
-
-      expect(response.status).toBe(200);
-      expect(response.body).toEqual(mockExpiry);
-      expect(getUserKeyExpiry).toHaveBeenCalledWith({
-        userId: 'test-user-123',
-        name: 'openAI',
-      });
-    });
-  });
-});
--- a/api/server/routes/tests/mcp.spec.js
+++ b/api/server/routes/tests/mcp.spec.js
@ -1,18 +1,8 @@
-const crypto = require('crypto');
 const express = require('express');
 const request = require('supertest');
 const mongoose = require('mongoose');
-const cookieParser = require('cookie-parser');
-const { getBasePath } = require('@librechat/api');
 const { MongoMemoryServer } = require('mongodb-memory-server');
-
-function generateTestCsrfToken(flowId) {
-  return crypto
-    .createHmac('sha256', process.env.JWT_SECRET)
-    .update(flowId)
-    .digest('hex')
-    .slice(0, 32);
-}
+const { getBasePath } = require('@librechat/api');

 const mockRegistryInstance = {
  getServerConfig: jest.fn(),
@ -32,9 +22,6 @@ jest.mock('@librechat/api', () => {
      getFlowState: jest.fn(),
      completeOAuthFlow: jest.fn(),
      generateFlowId: jest.fn(),
-      resolveStateToFlowId: jest.fn(async (state) => state),
-      storeStateMapping: jest.fn(),
-      deleteStateMapping: jest.fn(),
    },
    MCPTokenStorage: {
      storeTokens: jest.fn(),
@ -143,7 +130,6 @@ describe('MCP Routes', () => {

    app = express();
    app.use(express.json());
-    app.use(cookieParser());

    app.use((req, res, next) => {
      req.user = { id: 'test-user-id' };
@ -182,15 +168,12 @@ describe('MCP Routes', () => {

      MCPOAuthHandler.initiateOAuthFlow.mockResolvedValue({
        authorizationUrl: 'https://oauth.example.com/auth',
-        flowId: 'test-user-id:test-server',
-        flowMetadata: { state: 'random-state-value' },
+        flowId: 'test-flow-id',
      });
-      MCPOAuthHandler.storeStateMapping.mockResolvedValue();
-      mockFlowManager.initFlow = jest.fn().mockResolvedValue();

      const response = await request(app).get('/api/mcp/test-server/oauth/initiate').query({
        userId: 'test-user-id',
-        flowId: 'test-user-id:test-server',
+        flowId: 'test-flow-id',
      });

      expect(response.status).toBe(302);
@ -207,7 +190,7 @@ describe('MCP Routes', () => {
    it('should return 403 when userId does not match authenticated user', async () => {
      const response = await request(app).get('/api/mcp/test-server/oauth/initiate').query({
        userId: 'different-user-id',
-        flowId: 'test-user-id:test-server',
+        flowId: 'test-flow-id',
      });

      expect(response.status).toBe(403);
@ -245,7 +228,7 @@ describe('MCP Routes', () => {

      const response = await request(app).get('/api/mcp/test-server/oauth/initiate').query({
        userId: 'test-user-id',
-        flowId: 'test-user-id:test-server',
+        flowId: 'test-flow-id',
      });

      expect(response.status).toBe(400);
@ -262,7 +245,7 @@ describe('MCP Routes', () => {

      const response = await request(app).get('/api/mcp/test-server/oauth/initiate').query({
        userId: 'test-user-id',
-        flowId: 'test-user-id:test-server',
+        flowId: 'test-flow-id',
      });

      expect(response.status).toBe(500);
@ -272,7 +255,7 @@ describe('MCP Routes', () => {
    it('should return 400 when flow state metadata is null', async () => {
      const mockFlowManager = {
        getFlowState: jest.fn().mockResolvedValue({
-          id: 'test-user-id:test-server',
+          id: 'test-flow-id',
          metadata: null,
        }),
      };
@ -282,7 +265,7 @@ describe('MCP Routes', () => {

      const response = await request(app).get('/api/mcp/test-server/oauth/initiate').query({
        userId: 'test-user-id',
-        flowId: 'test-user-id:test-server',
+        flowId: 'test-flow-id',
      });

      expect(response.status).toBe(400);
@ -297,7 +280,7 @@ describe('MCP Routes', () => {
    it('should redirect to error page when OAuth error is received', async () => {
      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
        error: 'access_denied',
-        state: 'test-user-id:test-server',
+        state: 'test-flow-id',
      });
      const basePath = getBasePath();

@ -307,7 +290,7 @@ describe('MCP Routes', () => {

    it('should redirect to error page when code is missing', async () => {
      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
-        state: 'test-user-id:test-server',
+        state: 'test-flow-id',
      });
      const basePath = getBasePath();

@ -325,169 +308,19 @@ describe('MCP Routes', () => {
      expect(response.headers.location).toBe(`${basePath}/oauth/error?error=missing_state`);
    });

-    it('should redirect to error page when CSRF cookie is missing', async () => {
-      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
-        code: 'test-auth-code',
-        state: 'test-user-id:test-server',
-      });
-      const basePath = getBasePath();
-
-      expect(response.status).toBe(302);
-      expect(response.headers.location).toBe(
-        `${basePath}/oauth/error?error=csrf_validation_failed`,
-      );
-    });
-
-    it('should redirect to error page when CSRF cookie does not match state', async () => {
-      const csrfToken = generateTestCsrfToken('different-flow-id');
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: 'test-user-id:test-server',
-        });
-      const basePath = getBasePath();
-
-      expect(response.status).toBe(302);
-      expect(response.headers.location).toBe(
-        `${basePath}/oauth/error?error=csrf_validation_failed`,
-      );
-    });
-
    it('should redirect to error page when flow state is not found', async () => {
      MCPOAuthHandler.getFlowState.mockResolvedValue(null);
-      const flowId = 'invalid-flow:id';
-      const csrfToken = generateTestCsrfToken(flowId);

-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'invalid-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/error?error=invalid_state`);
    });

-    describe('CSRF fallback via active PENDING flow', () => {
-      it('should proceed when a fresh PENDING flow exists and no cookies are present', async () => {
-        const flowId = 'test-user-id:test-server';
-        const mockFlowManager = {
-          getFlowState: jest.fn().mockResolvedValue({
-            status: 'PENDING',
-            createdAt: Date.now(),
-          }),
-          completeFlow: jest.fn().mockResolvedValue(true),
-          deleteFlow: jest.fn().mockResolvedValue(true),
-        };
-        const mockFlowState = {
-          serverName: 'test-server',
-          userId: 'test-user-id',
-          metadata: {},
-          clientInfo: {},
-          codeVerifier: 'test-verifier',
-        };
-
-        getLogStores.mockReturnValue({});
-        require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);
-        MCPOAuthHandler.getFlowState.mockResolvedValue(mockFlowState);
-        MCPOAuthHandler.completeOAuthFlow.mockResolvedValue({
-          access_token: 'test-token',
-        });
-        MCPTokenStorage.storeTokens.mockResolvedValue();
-        mockRegistryInstance.getServerConfig.mockResolvedValue({});
-
-        const mockMcpManager = {
-          getUserConnection: jest.fn().mockResolvedValue({
-            fetchTools: jest.fn().mockResolvedValue([]),
-          }),
-        };
-        require('~/config').getMCPManager.mockReturnValue(mockMcpManager);
-        require('~/config').getOAuthReconnectionManager.mockReturnValue({
-          clearReconnection: jest.fn(),
-        });
-        require('~/server/services/Config/mcp').updateMCPServerTools.mockResolvedValue();
-
-        const response = await request(app)
-          .get('/api/mcp/test-server/oauth/callback')
-          .query({ code: 'test-code', state: flowId });
-
-        const basePath = getBasePath();
-        expect(response.status).toBe(302);
-        expect(response.headers.location).toContain(`${basePath}/oauth/success`);
-      });
-
-      it('should reject when no PENDING flow exists and no cookies are present', async () => {
-        const flowId = 'test-user-id:test-server';
-        const mockFlowManager = {
-          getFlowState: jest.fn().mockResolvedValue(null),
-        };
-
-        getLogStores.mockReturnValue({});
-        require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);
-
-        const response = await request(app)
-          .get('/api/mcp/test-server/oauth/callback')
-          .query({ code: 'test-code', state: flowId });
-
-        const basePath = getBasePath();
-        expect(response.status).toBe(302);
-        expect(response.headers.location).toBe(
-          `${basePath}/oauth/error?error=csrf_validation_failed`,
-        );
-      });
-
-      it('should reject when only a COMPLETED flow exists (not PENDING)', async () => {
-        const flowId = 'test-user-id:test-server';
-        const mockFlowManager = {
-          getFlowState: jest.fn().mockResolvedValue({
-            status: 'COMPLETED',
-            createdAt: Date.now(),
-          }),
-        };
-
-        getLogStores.mockReturnValue({});
-        require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);
-
-        const response = await request(app)
-          .get('/api/mcp/test-server/oauth/callback')
-          .query({ code: 'test-code', state: flowId });
-
-        const basePath = getBasePath();
-        expect(response.status).toBe(302);
-        expect(response.headers.location).toBe(
-          `${basePath}/oauth/error?error=csrf_validation_failed`,
-        );
-      });
-
-      it('should reject when PENDING flow is stale (older than PENDING_STALE_MS)', async () => {
-        const flowId = 'test-user-id:test-server';
-        const mockFlowManager = {
-          getFlowState: jest.fn().mockResolvedValue({
-            status: 'PENDING',
-            createdAt: Date.now() - 3 * 60 * 1000,
-          }),
-        };
-
-        getLogStores.mockReturnValue({});
-        require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);
-
-        const response = await request(app)
-          .get('/api/mcp/test-server/oauth/callback')
-          .query({ code: 'test-code', state: flowId });
-
-        const basePath = getBasePath();
-        expect(response.status).toBe(302);
-        expect(response.headers.location).toBe(
-          `${basePath}/oauth/error?error=csrf_validation_failed`,
-        );
-      });
-    });
-
    it('should handle OAuth callback successfully', async () => {
      // mockRegistryInstance is defined at the top of the file
      const mockFlowManager = {
@ -536,22 +369,16 @@ describe('MCP Routes', () => {
      });
      setCachedTools.mockResolvedValue();

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/success?serverName=test-server`);
      expect(MCPOAuthHandler.completeOAuthFlow).toHaveBeenCalledWith(
-        flowId,
+        'test-flow-id',
        'test-auth-code',
        mockFlowManager,
        {},
@ -573,24 +400,16 @@ describe('MCP Routes', () => {
        'mcp_oauth',
        mockTokens,
      );
-      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith(
-        'test-user-id:test-server',
-        'mcp_get_tokens',
-      );
+      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith('test-flow-id', 'mcp_get_tokens');
    });

    it('should redirect to error page when callback processing fails', async () => {
      MCPOAuthHandler.getFlowState.mockRejectedValue(new Error('Callback error'));
-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);

-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
@ -623,21 +442,15 @@ describe('MCP Routes', () => {
      getLogStores.mockReturnValue({});
      require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/success?serverName=test-server`);
-      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith(flowId, 'mcp_get_tokens');
+      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith('test-flow-id', 'mcp_get_tokens');
    });

    it('should handle reconnection failure after OAuth', async () => {
@ -675,22 +488,16 @@ describe('MCP Routes', () => {
      getCachedTools.mockResolvedValue({});
      setCachedTools.mockResolvedValue();

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/success?serverName=test-server`);
      expect(MCPTokenStorage.storeTokens).toHaveBeenCalled();
-      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith(flowId, 'mcp_get_tokens');
+      expect(mockFlowManager.deleteFlow).toHaveBeenCalledWith('test-flow-id', 'mcp_get_tokens');
    });

    it('should redirect to error page if token storage fails', async () => {
@ -723,16 +530,10 @@ describe('MCP Routes', () => {
      };
      require('~/config').getMCPManager.mockReturnValue(mockMcpManager);

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
@ -788,27 +589,22 @@ describe('MCP Routes', () => {
        clearReconnection: jest.fn(),
      });

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/success?serverName=test-server`);

+      // Verify storeTokens was called with ORIGINAL flow state credentials
      expect(MCPTokenStorage.storeTokens).toHaveBeenCalledWith(
        expect.objectContaining({
          userId: 'test-user-id',
          serverName: 'test-server',
          tokens: mockTokens,
-          clientInfo: clientInfo,
+          clientInfo: clientInfo, // Uses original flow state, not any "updated" credentials
          metadata: flowState.metadata,
        }),
      );
@ -835,21 +631,16 @@ describe('MCP Routes', () => {
      getLogStores.mockReturnValue({});
      require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
-      const response = await request(app)
-        .get('/api/mcp/test-server/oauth/callback')
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
-        .query({
-          code: 'test-auth-code',
-          state: flowId,
-        });
+      const response = await request(app).get('/api/mcp/test-server/oauth/callback').query({
+        code: 'test-auth-code',
+        state: 'test-flow-id',
+      });
      const basePath = getBasePath();

      expect(response.status).toBe(302);
      expect(response.headers.location).toBe(`${basePath}/oauth/success?serverName=test-server`);

+      // Verify completeOAuthFlow was NOT called (prevented duplicate)
      expect(MCPOAuthHandler.completeOAuthFlow).not.toHaveBeenCalled();
      expect(MCPTokenStorage.storeTokens).not.toHaveBeenCalled();
    });
@ -964,7 +755,7 @@ describe('MCP Routes', () => {
      getLogStores.mockReturnValue({});
      require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);

-      const response = await request(app).get('/api/mcp/oauth/status/test-user-id:test-server');
+      const response = await request(app).get('/api/mcp/oauth/status/test-flow-id');

      expect(response.status).toBe(200);
      expect(response.body).toEqual({
@ -975,13 +766,6 @@ describe('MCP Routes', () => {
      });
    });

-    it('should return 403 when flowId does not match authenticated user', async () => {
-      const response = await request(app).get('/api/mcp/oauth/status/other-user-id:test-server');
-
-      expect(response.status).toBe(403);
-      expect(response.body).toEqual({ error: 'Access denied' });
-    });
-
    it('should return 404 when flow is not found', async () => {
      const mockFlowManager = {
        getFlowState: jest.fn().mockResolvedValue(null),
@ -990,7 +774,7 @@ describe('MCP Routes', () => {
      getLogStores.mockReturnValue({});
      require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);

-      const response = await request(app).get('/api/mcp/oauth/status/test-user-id:non-existent');
+      const response = await request(app).get('/api/mcp/oauth/status/non-existent-flow');

      expect(response.status).toBe(404);
      expect(response.body).toEqual({ error: 'Flow not found' });
@ -1004,7 +788,7 @@ describe('MCP Routes', () => {
      getLogStores.mockReturnValue({});
      require('~/config').getFlowStateManager.mockReturnValue(mockFlowManager);

-      const response = await request(app).get('/api/mcp/oauth/status/test-user-id:error-server');
+      const response = await request(app).get('/api/mcp/oauth/status/error-flow-id');

      expect(response.status).toBe(500);
      expect(response.body).toEqual({ error: 'Failed to get flow status' });
@ -1591,7 +1375,7 @@ describe('MCP Routes', () => {
        refresh_token: 'edge-refresh-token',
      };
      MCPOAuthHandler.getFlowState = jest.fn().mockResolvedValue({
-        id: 'test-user-id:test-server',
+        id: 'test-flow-id',
        userId: 'test-user-id',
        metadata: {
          serverUrl: 'https://example.com',
@ -1619,12 +1403,8 @@ describe('MCP Routes', () => {
      };
      require('~/config').getMCPManager.mockReturnValue(mockMcpManager);

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
      const response = await request(app)
-        .get(`/api/mcp/test-server/oauth/callback?code=test-code&state=${flowId}`)
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
+        .get('/api/mcp/test-server/oauth/callback?code=test-code&state=test-flow-id')
        .expect(302);

      const basePath = getBasePath();
@ -1644,7 +1424,7 @@ describe('MCP Routes', () => {

      const mockFlowManager = {
        getFlowState: jest.fn().mockResolvedValue({
-          id: 'test-user-id:test-server',
+          id: 'test-flow-id',
          userId: 'test-user-id',
          metadata: { serverUrl: 'https://example.com', oauth: {} },
          clientInfo: {},
@ -1673,12 +1453,8 @@ describe('MCP Routes', () => {
      };
      require('~/config').getMCPManager.mockReturnValue(mockMcpManager);

-      const flowId = 'test-user-id:test-server';
-      const csrfToken = generateTestCsrfToken(flowId);
-
      const response = await request(app)
-        .get(`/api/mcp/test-server/oauth/callback?code=test-code&state=${flowId}`)
-        .set('Cookie', [`oauth_csrf=${csrfToken}`])
+        .get('/api/mcp/test-server/oauth/callback?code=test-code&state=test-flow-id')
        .expect(302);

      const basePath = getBasePath();
@ -1693,14 +1469,12 @@ describe('MCP Routes', () => {
    it('should return all server configs for authenticated user', async () => {
      const mockServerConfigs = {
        'server-1': {
-          type: 'sse',
-          url: 'http://server1.com/sse',
-          title: 'Server 1',
+          endpoint: 'http://server1.com',
+          name: 'Server 1',
        },
        'server-2': {
-          type: 'sse',
-          url: 'http://server2.com/sse',
-          title: 'Server 2',
+          endpoint: 'http://server2.com',
+          name: 'Server 2',
        },
      };

@ -1709,18 +1483,7 @@ describe('MCP Routes', () => {
      const response = await request(app).get('/api/mcp/servers');

      expect(response.status).toBe(200);
-      expect(response.body['server-1']).toMatchObject({
-        type: 'sse',
-        url: 'http://server1.com/sse',
-        title: 'Server 1',
-      });
-      expect(response.body['server-2']).toMatchObject({
-        type: 'sse',
-        url: 'http://server2.com/sse',
-        title: 'Server 2',
-      });
-      expect(response.body['server-1'].headers).toBeUndefined();
-      expect(response.body['server-2'].headers).toBeUndefined();
+      expect(response.body).toEqual(mockServerConfigs);
      expect(mockRegistryInstance.getAllServerConfigs).toHaveBeenCalledWith('test-user-id');
    });

@ -1775,10 +1538,10 @@ describe('MCP Routes', () => {
      const response = await request(app).post('/api/mcp/servers').send({ config: validConfig });

      expect(response.status).toBe(201);
-      expect(response.body.serverName).toBe('test-sse-server');
-      expect(response.body.type).toBe('sse');
-      expect(response.body.url).toBe('https://mcp-server.example.com/sse');
-      expect(response.body.title).toBe('Test SSE Server');
+      expect(response.body).toEqual({
+        serverName: 'test-sse-server',
+        ...validConfig,
+      });
      expect(mockRegistryInstance.addServer).toHaveBeenCalledWith(
        'temp_server_name',
        expect.objectContaining({
@ -1832,78 +1595,6 @@ describe('MCP Routes', () => {
      expect(response.body.message).toBe('Invalid configuration');
    });

-    it('should reject SSE URL containing env variable references', async () => {
-      const response = await request(app)
-        .post('/api/mcp/servers')
-        .send({
-          config: {
-            type: 'sse',
-            url: 'http://attacker.com/?secret=${JWT_SECRET}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.addServer).not.toHaveBeenCalled();
-    });
-
-    it('should reject streamable-http URL containing env variable references', async () => {
-      const response = await request(app)
-        .post('/api/mcp/servers')
-        .send({
-          config: {
-            type: 'streamable-http',
-            url: 'http://attacker.com/?key=${CREDS_KEY}&iv=${CREDS_IV}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.addServer).not.toHaveBeenCalled();
-    });
-
-    it('should reject websocket URL containing env variable references', async () => {
-      const response = await request(app)
-        .post('/api/mcp/servers')
-        .send({
-          config: {
-            type: 'websocket',
-            url: 'ws://attacker.com/?secret=${MONGO_URI}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.addServer).not.toHaveBeenCalled();
-    });
-
-    it('should redact secrets from create response', async () => {
-      const validConfig = {
-        type: 'sse',
-        url: 'https://mcp-server.example.com/sse',
-        title: 'Test Server',
-      };
-
-      mockRegistryInstance.addServer.mockResolvedValue({
-        serverName: 'test-server',
-        config: {
-          ...validConfig,
-          apiKey: { source: 'admin', authorization_type: 'bearer', key: 'admin-secret-key' },
-          oauth: { client_id: 'cid', client_secret: 'admin-oauth-secret' },
-          headers: { Authorization: 'Bearer leaked-token' },
-        },
-      });
-
-      const response = await request(app).post('/api/mcp/servers').send({ config: validConfig });
-
-      expect(response.status).toBe(201);
-      expect(response.body.apiKey?.key).toBeUndefined();
-      expect(response.body.oauth?.client_secret).toBeUndefined();
-      expect(response.body.headers).toBeUndefined();
-      expect(response.body.apiKey?.source).toBe('admin');
-      expect(response.body.oauth?.client_id).toBe('cid');
-    });
-
    it('should return 500 when registry throws error', async () => {
      const validConfig = {
        type: 'sse',
@ -1933,9 +1624,7 @@ describe('MCP Routes', () => {
      const response = await request(app).get('/api/mcp/servers/test-server');

      expect(response.status).toBe(200);
-      expect(response.body.type).toBe('sse');
-      expect(response.body.url).toBe('https://mcp-server.example.com/sse');
-      expect(response.body.title).toBe('Test Server');
+      expect(response.body).toEqual(mockConfig);
      expect(mockRegistryInstance.getServerConfig).toHaveBeenCalledWith(
        'test-server',
        'test-user-id',
@ -1951,29 +1640,6 @@ describe('MCP Routes', () => {
      expect(response.body).toEqual({ message: 'MCP server not found' });
    });

-    it('should redact secrets from get response', async () => {
-      mockRegistryInstance.getServerConfig.mockResolvedValue({
-        type: 'sse',
-        url: 'https://mcp-server.example.com/sse',
-        title: 'Secret Server',
-        apiKey: { source: 'admin', authorization_type: 'bearer', key: 'decrypted-admin-key' },
-        oauth: { client_id: 'cid', client_secret: 'decrypted-oauth-secret' },
-        headers: { Authorization: 'Bearer internal-token' },
-        oauth_headers: { 'X-OAuth': 'secret-value' },
-      });
-
-      const response = await request(app).get('/api/mcp/servers/secret-server');
-
-      expect(response.status).toBe(200);
-      expect(response.body.title).toBe('Secret Server');
-      expect(response.body.apiKey?.key).toBeUndefined();
-      expect(response.body.apiKey?.source).toBe('admin');
-      expect(response.body.oauth?.client_secret).toBeUndefined();
-      expect(response.body.oauth?.client_id).toBe('cid');
-      expect(response.body.headers).toBeUndefined();
-      expect(response.body.oauth_headers).toBeUndefined();
-    });
-
    it('should return 500 when registry throws error', async () => {
      mockRegistryInstance.getServerConfig.mockRejectedValue(new Error('Database error'));

@ -2000,9 +1666,7 @@ describe('MCP Routes', () => {
        .send({ config: updatedConfig });

      expect(response.status).toBe(200);
-      expect(response.body.type).toBe('sse');
-      expect(response.body.url).toBe('https://updated-mcp-server.example.com/sse');
-      expect(response.body.title).toBe('Updated Server');
+      expect(response.body).toEqual(updatedConfig);
      expect(mockRegistryInstance.updateServer).toHaveBeenCalledWith(
        'test-server',
        expect.objectContaining({
@ -2014,35 +1678,6 @@ describe('MCP Routes', () => {
      );
    });

-    it('should redact secrets from update response', async () => {
-      const validConfig = {
-        type: 'sse',
-        url: 'https://mcp-server.example.com/sse',
-        title: 'Updated Server',
-      };
-
-      mockRegistryInstance.updateServer.mockResolvedValue({
-        ...validConfig,
-        apiKey: { source: 'admin', authorization_type: 'bearer', key: 'preserved-admin-key' },
-        oauth: { client_id: 'cid', client_secret: 'preserved-oauth-secret' },
-        headers: { Authorization: 'Bearer internal-token' },
-        env: { DATABASE_URL: 'postgres://admin:pass@localhost/db' },
-      });
-
-      const response = await request(app)
-        .patch('/api/mcp/servers/test-server')
-        .send({ config: validConfig });
-
-      expect(response.status).toBe(200);
-      expect(response.body.title).toBe('Updated Server');
-      expect(response.body.apiKey?.key).toBeUndefined();
-      expect(response.body.apiKey?.source).toBe('admin');
-      expect(response.body.oauth?.client_secret).toBeUndefined();
-      expect(response.body.oauth?.client_id).toBe('cid');
-      expect(response.body.headers).toBeUndefined();
-      expect(response.body.env).toBeUndefined();
-    });
-
    it('should return 400 for invalid configuration', async () => {
      const invalidConfig = {
        type: 'sse',
@ -2059,51 +1694,6 @@ describe('MCP Routes', () => {
      expect(response.body.errors).toBeDefined();
    });

-    it('should reject SSE URL containing env variable references', async () => {
-      const response = await request(app)
-        .patch('/api/mcp/servers/test-server')
-        .send({
-          config: {
-            type: 'sse',
-            url: 'http://attacker.com/?secret=${JWT_SECRET}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.updateServer).not.toHaveBeenCalled();
-    });
-
-    it('should reject streamable-http URL containing env variable references', async () => {
-      const response = await request(app)
-        .patch('/api/mcp/servers/test-server')
-        .send({
-          config: {
-            type: 'streamable-http',
-            url: 'http://attacker.com/?key=${CREDS_KEY}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.updateServer).not.toHaveBeenCalled();
-    });
-
-    it('should reject websocket URL containing env variable references', async () => {
-      const response = await request(app)
-        .patch('/api/mcp/servers/test-server')
-        .send({
-          config: {
-            type: 'websocket',
-            url: 'ws://attacker.com/?secret=${MONGO_URI}',
-          },
-        });
-
-      expect(response.status).toBe(400);
-      expect(response.body.message).toBe('Invalid configuration');
-      expect(mockRegistryInstance.updateServer).not.toHaveBeenCalled();
-    });
-
    it('should return 500 when registry throws error', async () => {
      const validConfig = {
        type: 'sse',
--- a/api/server/routes/tests/messages-delete.spec.js
+++ b/api/server/routes/tests/messages-delete.spec.js
@ -1,200 +0,0 @@
-const mongoose = require('mongoose');
-const express = require('express');
-const request = require('supertest');
-const { v4: uuidv4 } = require('uuid');
-const { MongoMemoryServer } = require('mongodb-memory-server');
-
-jest.mock('@librechat/agents', () => ({
-  sleep: jest.fn(),
-}));
-
-jest.mock('@librechat/api', () => ({
-  unescapeLaTeX: jest.fn((x) => x),
-  countTokens: jest.fn().mockResolvedValue(10),
-}));
-
-jest.mock('@librechat/data-schemas', () => ({
-  ...jest.requireActual('@librechat/data-schemas'),
-  logger: {
-    debug: jest.fn(),
-    info: jest.fn(),
-    warn: jest.fn(),
-    error: jest.fn(),
-  },
-}));
-
-jest.mock('librechat-data-provider', () => ({
-  ...jest.requireActual('librechat-data-provider'),
-}));
-
-jest.mock('~/models', () => ({
-  saveConvo: jest.fn(),
-  getMessage: jest.fn(),
-  saveMessage: jest.fn(),
-  getMessages: jest.fn(),
-  updateMessage: jest.fn(),
-  deleteMessages: jest.fn(),
-}));
-
-jest.mock('~/server/services/Artifacts/update', () => ({
-  findAllArtifacts: jest.fn(),
-  replaceArtifactContent: jest.fn(),
-}));
-
-jest.mock('~/server/middleware/requireJwtAuth', () => (req, res, next) => next());
-
-jest.mock('~/server/middleware', () => ({
-  requireJwtAuth: (req, res, next) => next(),
-  validateMessageReq: (req, res, next) => next(),
-}));
-
-jest.mock('~/models/Conversation', () => ({
-  getConvosQueried: jest.fn(),
-}));
-
-jest.mock('~/db/models', () => ({
-  Message: {
-    findOne: jest.fn(),
-    find: jest.fn(),
-    meiliSearch: jest.fn(),
-  },
-}));
-
-/* ─── Model-level tests: real MongoDB, proves cross-user deletion is prevented ─── */
-
-const { messageSchema } = require('@librechat/data-schemas');
-
-describe('deleteMessages – model-level IDOR prevention', () => {
-  let mongoServer;
-  let Message;
-
-  const ownerUserId = 'user-owner-111';
-  const attackerUserId = 'user-attacker-222';
-
-  beforeAll(async () => {
-    mongoServer = await MongoMemoryServer.create();
-    Message = mongoose.models.Message || mongoose.model('Message', messageSchema);
-    await mongoose.connect(mongoServer.getUri());
-  });
-
-  afterAll(async () => {
-    await mongoose.disconnect();
-    await mongoServer.stop();
-  });
-
-  beforeEach(async () => {
-    await Message.deleteMany({});
-  });
-
-  it("should NOT delete another user's message when attacker supplies victim messageId", async () => {
-    const conversationId = uuidv4();
-    const victimMsgId = 'victim-msg-001';
-
-    await Message.create({
-      messageId: victimMsgId,
-      conversationId,
-      user: ownerUserId,
-      text: 'Sensitive owner data',
-    });
-
-    await Message.deleteMany({ messageId: victimMsgId, user: attackerUserId });
-
-    const victimMsg = await Message.findOne({ messageId: victimMsgId }).lean();
-    expect(victimMsg).not.toBeNull();
-    expect(victimMsg.user).toBe(ownerUserId);
-    expect(victimMsg.text).toBe('Sensitive owner data');
-  });
-
-  it("should delete the user's own message", async () => {
-    const conversationId = uuidv4();
-    const ownMsgId = 'own-msg-001';
-
-    await Message.create({
-      messageId: ownMsgId,
-      conversationId,
-      user: ownerUserId,
-      text: 'My message',
-    });
-
-    const result = await Message.deleteMany({ messageId: ownMsgId, user: ownerUserId });
-    expect(result.deletedCount).toBe(1);
-
-    const deleted = await Message.findOne({ messageId: ownMsgId }).lean();
-    expect(deleted).toBeNull();
-  });
-
-  it('should scope deletion by conversationId, messageId, and user together', async () => {
-    const convoA = uuidv4();
-    const convoB = uuidv4();
-
-    await Message.create([
-      { messageId: 'msg-a1', conversationId: convoA, user: ownerUserId, text: 'A1' },
-      { messageId: 'msg-b1', conversationId: convoB, user: ownerUserId, text: 'B1' },
-    ]);
-
-    await Message.deleteMany({ messageId: 'msg-a1', conversationId: convoA, user: attackerUserId });
-
-    const remaining = await Message.find({ user: ownerUserId }).lean();
-    expect(remaining).toHaveLength(2);
-  });
-});
-
-/* ─── Route-level tests: supertest + mocked deleteMessages ─── */
-
-describe('DELETE /:conversationId/:messageId – route handler', () => {
-  let app;
-  const { deleteMessages } = require('~/models');
-
-  const authenticatedUserId = 'user-owner-123';
-
-  beforeAll(() => {
-    const messagesRouter = require('../messages');
-
-    app = express();
-    app.use(express.json());
-    app.use((req, res, next) => {
-      req.user = { id: authenticatedUserId };
-      next();
-    });
-    app.use('/api/messages', messagesRouter);
-  });
-
-  beforeEach(() => {
-    jest.clearAllMocks();
-  });
-
-  it('should pass user and conversationId in the deleteMessages filter', async () => {
-    deleteMessages.mockResolvedValue({ deletedCount: 1 });
-
-    await request(app).delete('/api/messages/convo-1/msg-1');
-
-    expect(deleteMessages).toHaveBeenCalledTimes(1);
-    expect(deleteMessages).toHaveBeenCalledWith({
-      messageId: 'msg-1',
-      conversationId: 'convo-1',
-      user: authenticatedUserId,
-    });
-  });
-
-  it('should return 204 on successful deletion', async () => {
-    deleteMessages.mockResolvedValue({ deletedCount: 1 });
-
-    const response = await request(app).delete('/api/messages/convo-1/msg-owned');
-
-    expect(response.status).toBe(204);
-    expect(deleteMessages).toHaveBeenCalledWith({
-      messageId: 'msg-owned',
-      conversationId: 'convo-1',
-      user: authenticatedUserId,
-    });
-  });
-
-  it('should return 500 when deleteMessages throws', async () => {
-    deleteMessages.mockRejectedValue(new Error('DB failure'));
-
-    const response = await request(app).delete('/api/messages/convo-1/msg-1');
-
-    expect(response.status).toBe(500);
-    expect(response.body).toEqual({ error: 'Internal server error' });
-  });
-});
--- a/Show more
+++ b/Show more