refactor: replace approximateTokenSize with estimateTokenCount and update tests

johannschopplich · johannschopplich · commit 14ba6ddf7e3c · 2025-09-23T13:33:00.000+02:00
diff --git a/scripts/generateTable.ts b/scripts/generateTable.ts
@@ -2,7 +2,7 @@ import { readFile, writeFile } from 'node:fs/promises'
 import { join } from 'node:path'
 import { fileURLToPath } from 'node:url'
 import { encode } from 'gpt-tokenizer'
-import { approximateTokenSize } from '../src/index'
+import { estimateTokenCount } from '../src/index'
 
 const rootDir = join(fileURLToPath(new URL('../', import.meta.url)))
 const readmePath = join(rootDir, 'README.md')
@@ -49,7 +49,7 @@ for (const example of tokenExamples) {
     ? (await readFile(example.input, 'utf-8'))
     : example.input
   const tokenCount = encode(text).length
-  const estimatedTokenCount = approximateTokenSize(text)
+  const estimatedTokenCount = estimateTokenCount(text)
   const errorPercentage = ((Math.abs(tokenCount - estimatedTokenCount) / tokenCount) * 100).toFixed(2)
 
   markdownTable += `| ${[
diff --git a/src/index.ts b/src/index.ts
@@ -34,7 +34,7 @@ export function isWithinTokenLimit(
   return estimateTokenCount(text, options) <= tokenLimit
 }
 
-// Legacy alias for backward compatibility
+/** @deprecated Use `estimateTokenCount` instead */
 export const approximateTokenSize: typeof estimateTokenCount = estimateTokenCount
 
 /**
diff --git a/test/index.test.ts b/test/index.test.ts
@@ -3,7 +3,6 @@ import { join } from 'node:path'
 import { fileURLToPath } from 'node:url'
 import { describe, expect, it } from 'vitest'
 import {
-  approximateTokenSize,
   estimateTokenCount,
   isWithinTokenLimit,
   sliceByTokens,
@@ -15,38 +14,28 @@ describe('token-related functions', () => {
   const ENGLISH_TEXT = 'Hello, world! This is a short sentence.'
   const GERMAN_TEXT = 'Die pünktlich gewünschte Trüffelfüllung im übergestülpten Würzkümmel-Würfel ist kümmerlich und dürfte fürderhin zu Rüffeln in Hülle und Fülle führen'
 
-  describe('approximateTokenSize (legacy)', () => {
-    it('should approximate the token size for short English text', () => {
-      expect(approximateTokenSize(ENGLISH_TEXT)).toMatchInlineSnapshot('11')
+  describe('estimateTokenCount', () => {
+    it('should estimate tokens for short English text', () => {
+      expect(estimateTokenCount(ENGLISH_TEXT)).toMatchInlineSnapshot('11')
     })
 
-    it('should approximate the token size for short German text with umlauts', () => {
-      expect(approximateTokenSize(GERMAN_TEXT)).toMatchInlineSnapshot('49')
+    it('should estimate tokens for German text with umlauts', () => {
+      expect(estimateTokenCount(GERMAN_TEXT)).toMatchInlineSnapshot('49')
     })
 
     it('should approximate the token size for English ebook', async () => {
       const input = await readFile(join(fixturesDir, 'ebooks/pg5200.txt'), 'utf-8')
-      expect(approximateTokenSize(input)).toMatchInlineSnapshot(`35705`)
+      expect(estimateTokenCount(input)).toMatchInlineSnapshot(`35705`)
     })
 
     it('should approximate the token size for German ebook', async () => {
       const input = await readFile(join(fixturesDir, 'ebooks/pg22367.txt'), 'utf-8')
-      expect(approximateTokenSize(input)).toMatchInlineSnapshot(`35069`)
+      expect(estimateTokenCount(input)).toMatchInlineSnapshot(`35069`)
     })
 
     it('should approximate the token size for Chinese ebook', async () => {
       const input = await readFile(join(fixturesDir, 'ebooks/pg7337.txt'), 'utf-8')
-      expect(approximateTokenSize(input)).toMatchInlineSnapshot(`12059`)
-    })
-  })
-
-  describe('estimateTokenCount', () => {
-    it('should estimate tokens for short English text', () => {
-      expect(estimateTokenCount(ENGLISH_TEXT)).toMatchInlineSnapshot('11')
-    })
-
-    it('should estimate tokens for German text with umlauts', () => {
-      expect(estimateTokenCount(GERMAN_TEXT)).toMatchInlineSnapshot('49')
+      expect(estimateTokenCount(input)).toMatchInlineSnapshot(`12059`)
     })
 
     it('should handle empty input', () => {

Original file line number	Diff line number	Diff line change
`@@ -34,7 +34,7 @@ export function isWithinTokenLimit(`
`34`	`34`	`return estimateTokenCount(text, options) <= tokenLimit`
`35`	`35`	`}`
`36`	`36`
`37`		`-// Legacy alias for backward compatibility`
	`37`	``+/** @deprecated Use `estimateTokenCount` instead */``
`38`	`38`	`export const approximateTokenSize: typeof estimateTokenCount = estimateTokenCount`
`39`	`39`
`40`	`40`	`/**`