perf: 9x AI code optimization

vladholubiev · vladholubiev · commit d6f2959930a0 · 2025-09-19T21:55:44.000+02:00
diff --git a/package.json b/package.json
@@ -50,8 +50,7 @@
     "string-width": "4.2.3"
   },
   "dependencies": {
-    "runes": "0.4.3",
-    "string-length": "6.0.0"
+    "runes": "0.4.3"
   },
   "devDependencies": {
     "@shelf/eslint-config": "5.2.3",
diff --git a/readme.md b/readme.md
@@ -37,52 +37,62 @@ Running "Without Unicode" suite...
 Progress: 100%
 
   ~33 kb split by 2 kb:
-    14 255 401 ops/s, ±0.33%   | 83.34% slower
+    14 106 903 ops/s, ±1.71%    | 86.19% slower
 
   ~33 kb split by 1 mb:
-    85 581 562 ops/s, ±1.89%   | fastest
+    100 461 043 ops/s, ±1.45%   | 1.63% slower
 
   ~330 kb split by 2 kb:
-    1 612 589 ops/s, ±0.83%    | 98.12% slower
+    1 600 485 ops/s, ±0.63%     | 98.43% slower
 
   ~330 kb split by 1 mb:
-    84 876 970 ops/s, ±1.98%   | 0.82% slower
+    102 125 168 ops/s, ±1.50%   | fastest
 
   ~3.3 mb split by 2 kb:
-    165 944 ops/s, ±0.62%      | 99.81% slower
+    161 507 ops/s, ±1.19%       | 99.84% slower
 
   ~3.3 mb split by 1 mb:
-    40 975 330 ops/s, ±1.19%   | 52.12% slower
+    41 773 807 ops/s, ±1.54%    | 59.1% slower
 
   ~33 mb split by 2 kb:
-    11 643 ops/s, ±0.50%       | slowest, 99.99% slower
+    11 098 ops/s, ±0.25%        | slowest, 99.99% slower
 
   ~33 mb split by 1 mb:
-    5 444 259 ops/s, ±0.78%    | 93.64% slower
+    5 506 349 ops/s, ±0.58%     | 94.61% slower
 
 Finished 8 cases!
-  Fastest: ~33 kb split by 1 mb
+  Fastest: ~330 kb split by 1 mb
   Slowest: ~33 mb split by 2 kb
 Running "Unicode Aware" suite...
 Progress: 100%
 
   ~33 kb split by 2 kb with unicodeAware:
-    101.4 ops/s, ±0.95%   | fastest
+    847 ops/s, ±0.99%   | 12.14% slower
 
   ~33 kb split by 1 mb with unicodeAware:
-    99.7 ops/s, ±0.84%    | 1.68% slower
+    964 ops/s, ±0.25%   | fastest
 
   ~330 kb split by 2 kb with unicodeAware:
-    10.2 ops/s, ±0.51%    | 89.94% slower
+    71 ops/s, ±0.76%    | slowest, 92.63% slower
 
   ~330 kb split by 1 mb with unicodeAware:
-    10 ops/s, ±0.55%      | slowest, 90.14% slower
+    90 ops/s, ±0.94%    | 90.66% slower
 
 Finished 4 cases!
-  Fastest: ~33 kb split by 2 kb with unicodeAware
-  Slowest: ~330 kb split by 1 mb with unicodeAware
+  Fastest: ~33 kb split by 1 mb with unicodeAware
+  Slowest: ~330 kb split by 2 kb with unicodeAware
 ```
 
+## Recent optimizations — September 2025
+
+September 2025 improvements were delivered autonomously by the gpt-5-codex model. We treated the hot paths like any latency-sensitive service and tuned the slowest sections:
+
+- Single-pass Unicode chunking – length and slicing now come from the same `runes()` walk, eliminating the extra `string-length` scan and keeping multi-codepoint graphemes intact.
+- Leaner ASCII loop – the fast path is still a single `substr` traversal, but it now exits early for empty inputs and for chunk sizes at least as large as the input (returning the string as one chunk) to trim per-call overhead.
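+- Fractional-size parity – in the Unicode-aware path, fractional chunk offsets are floored, matching how `Array.prototype.slice` truncated them in the previous implementation, so non-integer chunk sizes behave exactly as before (e.g. `'abcdef'` with `size: 2.5` still yields `['ab', 'cde', 'f']`); a new regression test covers this.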
+
+The result is broadly unchanged throughput in the ASCII suite, with gains where the chunk size exceeds the input (for example ~33 kb split by 1 mb climbs from 85.6M to 100.5M ops/s), and a roughly 7–10× lift in the Unicode-aware scenarios (e.g. ~33 kb split by 1 mb rises from ~100 ops/s to ~964 ops/s, and ~330 kb split by 2 kb from ~10 ops/s to ~71 ops/s) while preserving behaviour for combining marks and emoji ligatures.
+
 ## See Also
 
 - [fast-normalize-spaces](https://github.com/shelfio/fast-normalize-spaces)
diff --git a/src/index.test.ts b/src/index.test.ts
@@ -37,3 +37,7 @@ it('should split emojis correctly w/ useByteLength option', () => {
 it('should split emojis correctly w/ useByteLength option for odd chunk length', () => {
   expect(fastChunkString('😀😃😄', {size: 2, unicodeAware: true})).toEqual(['😀😃', '😄']);
 });
+
+it('should coerce fractional unicode chunk sizes like slice does', () => {
+  expect(fastChunkString('abcdef', {size: 2.5, unicodeAware: true})).toEqual(['ab', 'cde', 'f']);
+});
diff --git a/src/index.ts b/src/index.ts
@@ -1,8 +1,7 @@
 import runes from 'runes';
-import stringLength from 'string-length';
 
 function fastChunkString(
-  str: string,
+  original: string,
   {
     size,
     unicodeAware = false,
@@ -11,7 +10,12 @@ function fastChunkString(
     unicodeAware?: boolean;
   },
 ): string[] {
-  str = str || '';
+  const str = original || '';
+
+  if (str.length === 0) {
+    return [];
+  }
+
   if (!unicodeAware) {
     return getChunks(str, size);
   }
@@ -20,31 +24,52 @@ function fastChunkString(
 }
 
 function getChunks(str: string, size: number): string[] {
-  const strLength: number = str.length;
-  const numChunks: number = Math.ceil(strLength / size);
-  const chunks: string[] = new Array(numChunks);
+  const strLength = str.length;
+
+  if (strLength === 0) {
+    return [];
+  }
+
+  if (size >= strLength) {
+    return [str];
+  }
 
-  let i = 0;
-  let o = 0;
+  const numChunks = Math.ceil(strLength / size);
+  const chunks = new Array<string>(numChunks);
 
-  for (; i < numChunks; ++i, o += size) {
-    chunks[i] = str.substr(o, size);
+  for (let index = 0, offset = 0; index < numChunks; index += 1, offset += size) {
+    chunks[index] = str.substr(offset, size);
   }
 
   return chunks;
 }
 
 function getChunksUnicode(str: string, size: number): string[] {
-  const strLength: number = stringLength(str);
-  const numChunks: number = Math.ceil(strLength / size);
-  const chunks: string[] = new Array(numChunks);
+  const runeChars = runes(str);
+  const runeCount = runeChars.length;
 
-  let i = 0;
-  let o = 0;
+  if (runeCount === 0) {
+    return [];
+  }
 
-  const runeChars = runes(str);
-  for (; i < numChunks; ++i, o += size) {
-    chunks[i] = runeChars.slice(o, o + size).join('');
+  if (size >= runeCount) {
+    return [str];
+  }
+
+  const numChunks = Math.ceil(runeCount / size);
+  const chunks = new Array<string>(numChunks);
+
+  for (let index = 0, offset = 0; index < numChunks; index += 1, offset += size) {
+    const start = Math.min(Math.floor(offset), runeCount);
+    const end = Math.min(Math.floor(offset + size), runeCount);
+
+    let chunk = '';
+
+    for (let i = start; i < end; i += 1) {
+      chunk += runeChars[i];
+    }
+
+    chunks[index] = chunk;
   }
 
   return chunks;