refactor: add back getTokenCountForResponse for slightly more accurate mapping of responses token counts (#1067)

2026-02-06 17:51:50 +01:00 · 2023-10-17 06:42:58 -04:00 · 2023-10-17 06:42:58 -04:00 · 377f2c7c19
commit 377f2c7c19
parent 6d8aed7ef8
3 changed files with 26 additions and 6 deletions
--- a/api/app/clients/PluginsClient.js
+++ b/api/app/clients/PluginsClient.js
@@ -230,13 +230,15 @@ If your reverse proxy is compatible to OpenAI specs in every other way, it may s
      console.debug('[handleResponseMessage] Output:', { output, errorMessage, ...result });
    const { error } = responseMessage;
    if (!error) {
-      responseMessage.tokenCount = this.getTokenCount(responseMessage.text);
-      responseMessage.completionTokens = responseMessage.tokenCount;
+      responseMessage.tokenCount = this.getTokenCountForResponse(responseMessage);
+      responseMessage.completionTokens = this.getTokenCount(responseMessage.text);
    }

+    // Record usage only when completion is NOT skipped; when it is skipped, usage was already recorded in the agent phase.
    if (!this.agentOptions.skipCompletion && !error) {
      await this.recordTokenUsage(responseMessage);
    }
+
    await this.saveMessageToDatabase(responseMessage, saveOptions, user);
    delete responseMessage.tokenCount;
    return { ...responseMessage, ...result };