Mirror of https://github.com/Mintplex-Labs/anything-llm.git, synced 2025-04-17 18:18:11 +00:00

parent d95d1a9dfd
commit 3e088f22b1

2 changed files with 11 additions and 4 deletions
server/utils/helpers

@@ -300,7 +300,7 @@ function cannonball({
   // if the delta is the token difference between where our prompt is in size
   // and where we ideally need to land.
   const delta = initialInputSize - targetTokenSize;
-  const tokenChunks = tokenManager.countFromString(input);
+  const tokenChunks = tokenManager.tokensFromString(input);
   const middleIdx = Math.floor(tokenChunks.length / 2);
 
   // middle truncate the text going left and right of midpoint
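The one-line change above swaps `countFromString` for the new `tokensFromString`, so `tokenChunks` holds actual token ids rather than a plain count (a number has no `.length`, which the midpoint math below relies on). To make the surrounding middle-truncation logic easier to follow, here is a minimal, self-contained sketch of the idea, assuming the `TokenManager` helpers added in the next hunk; the `middleTruncate` wrapper and its slicing arithmetic are illustrative assumptions, not the repository's `cannonball()` implementation.

```js
// Illustrative sketch only: `middleTruncate` is a hypothetical helper; the slicing
// arithmetic is an assumption about "middle truncate ... left and right of midpoint".
function middleTruncate(tokenManager, input, initialInputSize, targetTokenSize) {
  // delta is how many tokens must be dropped to land at the target size.
  const delta = initialInputSize - targetTokenSize;
  if (delta <= 0) return input; // already within budget

  const tokenChunks = tokenManager.tokensFromString(input);
  const middleIdx = Math.floor(tokenChunks.length / 2);

  // Drop `delta` tokens centered on the midpoint, keeping both edges of the prompt.
  const left = tokenChunks.slice(0, middleIdx - Math.ceil(delta / 2));
  const right = tokenChunks.slice(middleIdx + Math.floor(delta / 2));

  // Decode the surviving token ids back to text via the TokenManager.
  return tokenManager.bytesFromTokens([...left, ...right]);
}
```
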
@@ -15,15 +15,22 @@ class TokenManager {
     }
   }
 
+  // Pass in an empty array of disallowedSpecials to handle all tokens as text and to be tokenized.
+  // https://github.com/openai/tiktoken/blob/9e79899bc248d5313c7dd73562b5e211d728723d/tiktoken/core.py#L91C20-L91C38
+  // Returns number[]
+  tokensFromString(input = "") {
+    const tokens = this.encoder.encode(input, undefined, []);
+    return tokens;
+  }
+
   bytesFromTokens(tokens = []) {
     const bytes = this.encoder.decode(tokens);
     return bytes;
   }
 
-  // Pass in an empty array of disallowedSpecials to handle all tokens as text and to be tokenized.
-  // https://github.com/openai/tiktoken/blob/9e79899bc248d5313c7dd73562b5e211d728723d/tiktoken/core.py#L91C20-L91C38
+  // Returns number
   countFromString(input = "") {
-    const tokens = this.encoder.encode(input, undefined, []);
+    const tokens = this.tokensFromString(input);
    return tokens.length;
   }
 
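For reference, a hedged usage sketch of the three `TokenManager` methods this commit touches. Only the method names and documented return types come from the diff; the module path and the argument-free constructor are assumptions. After the refactor, `this.encoder.encode` has a single call site, and `countFromString` is simply `tokensFromString(input).length`.

```js
// Hypothetical usage; the require path and constructor arguments are assumptions.
const { TokenManager } = require("./tiktoken");

const manager = new TokenManager();
const text = "Middle truncation keeps the head and tail of a long prompt.";

// tokensFromString returns the raw token ids (number[]).
const tokens = manager.tokensFromString(text);

// countFromString is now a thin wrapper over tokensFromString(...).length.
console.log(manager.countFromString(text) === tokens.length); // true

// bytesFromTokens runs the ids back through the encoder's decode().
console.log(manager.bytesFromTokens(tokens));
```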