feat: US-069 - Fix IPC binary frame length guards and fnv1aHash (TypeScript)

NathanFlurry · claude · NathanFlurry · commit ef4580b0c558 · 2026-03-19T21:09:29.000-07:00
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/packages/secure-exec-v8/src/index.ts b/packages/secure-exec-v8/src/index.ts
@@ -1,5 +1,5 @@
 // V8 runtime process manager.
-export { createV8Runtime } from "./runtime.js";
+export { createV8Runtime, fnv1aHash } from "./runtime.js";
 export type { V8Runtime, V8RuntimeOptions } from "./runtime.js";
 
 // V8 session types.
diff --git a/packages/secure-exec-v8/src/ipc-binary.ts b/packages/secure-exec-v8/src/ipc-binary.ts
@@ -222,14 +222,19 @@ export function decodeFrame(buf: Buffer): BinaryFrame {
 			}
 			let error: ExecutionErrorBin | null = null;
 			if (flags & FLAG_HAS_ERROR) {
-				const errorType = readLenPrefixedU16(buf, pos);
-				pos += 2 + Buffer.byteLength(errorType, "utf8");
-				const message = readLenPrefixedU16(buf, pos);
-				pos += 2 + Buffer.byteLength(message, "utf8");
-				const stack = readLenPrefixedU16(buf, pos);
-				pos += 2 + Buffer.byteLength(stack, "utf8");
-				const code = readLenPrefixedU16(buf, pos);
-				error = { errorType, message, stack, code };
+				const et = readLenPrefixedU16(buf, pos);
+				pos += et.bytesRead;
+				const msg = readLenPrefixedU16(buf, pos);
+				pos += msg.bytesRead;
+				const st = readLenPrefixedU16(buf, pos);
+				pos += st.bytesRead;
+				const cd = readLenPrefixedU16(buf, pos);
+				error = {
+					errorType: et.value,
+					message: msg.value,
+					stack: st.value,
+					code: cd.value,
+				};
 			}
 			return { type: "ExecutionResult", sessionId, exitCode, exports, error };
 		}
@@ -422,6 +427,11 @@ function encodeBody(frame: BinaryFrame): Buffer {
 
 function encodeSessionId(sid: string): Buffer {
 	const bytes = Buffer.from(sid, "utf8");
+	if (bytes.length > 255) {
+		throw new Error(
+			`Session ID byte length ${bytes.length} exceeds maximum 255`,
+		);
+	}
 	const out = Buffer.alloc(1 + bytes.length);
 	out[0] = bytes.length;
 	bytes.copy(out, 1);
@@ -430,15 +440,40 @@ function encodeSessionId(sid: string): Buffer {
 
 function writeLenPrefixedU16(s: string): Buffer {
 	const bytes = Buffer.from(s, "utf8");
+	if (bytes.length > 0xffff) {
+		throw new Error(
+			`String byte length ${bytes.length} exceeds maximum 65535`,
+		);
+	}
 	const out = Buffer.alloc(2 + bytes.length);
 	out.writeUInt16BE(bytes.length, 0);
 	bytes.copy(out, 2);
 	return out;
 }
 
-function readLenPrefixedU16(buf: Buffer, pos: number): string {
+/**
+ * Reads a u16 big-endian length prefix at `pos`, then that many UTF-8 bytes.
+ *
+ * @returns the decoded string and the total bytes consumed (prefix + payload),
+ *   so callers advance by the wire length rather than re-encoding the string.
+ * @throws RangeError if the prefix or the declared payload runs past `buf`.
+ */
+function readLenPrefixedU16(
+	buf: Buffer,
+	pos: number,
+): { value: string; bytesRead: number } {
 	const len = buf.readUInt16BE(pos);
-	return buf.toString("utf8", pos + 2, pos + 2 + len);
+	const start = pos + 2;
+	const end = start + len;
+	// Buffer#toString clamps `end` to buf.length, so a truncated frame would
+	// otherwise decode to a silently shortened string.
+	if (end > buf.length) {
+		throw new RangeError(
+			`String length ${len} at offset ${pos} exceeds buffer length ${buf.length}`,
+		);
+	}
+	const value = buf.toString("utf8", start, end);
+	return { value, bytesRead: 2 + len };
 }
 
 // Re-export v8 serialize/deserialize for convenience
diff --git a/packages/secure-exec-v8/src/runtime.ts b/packages/secure-exec-v8/src/runtime.ts
@@ -499,11 +499,12 @@ function readSocketPath(child: ChildProcess): Promise<string> {
 }
 
 /** FNV-1a hash of a string, returning a 32-bit integer.
- * Matches the hash algorithm used on the Rust side for bridge code comparison. */
-function fnv1aHash(str: string): number {
+ * Hashes over UTF-8 bytes to match the Rust side. */
+export function fnv1aHash(str: string): number {
+	const bytes = Buffer.from(str, "utf8");
 	let hash = 0x811c9dc5;
-	for (let i = 0; i < str.length; i++) {
-		hash ^= str.charCodeAt(i);
+	for (let i = 0; i < bytes.length; i++) {
+		hash ^= bytes[i];
 		hash = Math.imul(hash, 0x01000193);
 	}
 	return hash >>> 0;
diff --git a/packages/secure-exec-v8/test/ipc-binary.test.ts b/packages/secure-exec-v8/test/ipc-binary.test.ts
@@ -16,6 +16,7 @@ import {
 	deserializePayload,
 	type BinaryFrame,
 } from "../src/ipc-binary.js";
+import { fnv1aHash } from "../src/runtime.js";
 
 function roundtrip(frame: BinaryFrame): void {
 	const encoded = encodeFrame(frame);
@@ -751,3 +752,189 @@ describe("V8 serialize/deserialize payload integration", () => {
 		}
 	});
 });
+
+// -- Overflow guards --
+
+describe("overflow guards", () => {
+	it("encodeSessionId throws on >255 byte session ID", () => {
+		// 256 ASCII chars → 256 bytes UTF-8
+		const longSid = "x".repeat(256);
+		expect(() =>
+			encodeFrame({
+				type: "DestroySession",
+				sessionId: longSid,
+			}),
+		).toThrow("Session ID byte length 256 exceeds maximum 255");
+	});
+
+	it("encodeSessionId allows exactly 255 byte session ID", () => {
+		const sid255 = "a".repeat(255);
+		expect(() =>
+			encodeFrame({ type: "DestroySession", sessionId: sid255 }),
+		).not.toThrow();
+	});
+
+	it("encodeSessionId counts UTF-8 bytes not characters", () => {
+		// Each emoji is 4 bytes in UTF-8 — 64 emojis = 256 bytes → should throw
+		const emojiSid = "\u{1F600}".repeat(64);
+		expect(Buffer.byteLength(emojiSid, "utf8")).toBe(256);
+		expect(() =>
+			encodeFrame({ type: "DestroySession", sessionId: emojiSid }),
+		).toThrow("exceeds maximum 255");
+	});
+
+	it("writeLenPrefixedU16 throws on >65535 byte string", () => {
+		const longStr = "x".repeat(65536);
+		expect(() =>
+			encodeFrame({
+				type: "ExecutionResult",
+				sessionId: "s",
+				exitCode: 1,
+				exports: null,
+				error: {
+					errorType: longStr,
+					message: "",
+					stack: "",
+					code: "",
+				},
+			}),
+		).toThrow("String byte length 65536 exceeds maximum 65535");
+	});
+
+	it("writeLenPrefixedU16 allows exactly 65535 byte string", () => {
+		const str65535 = "a".repeat(65535);
+		expect(() =>
+			encodeFrame({
+				type: "ExecutionResult",
+				sessionId: "s",
+				exitCode: 1,
+				exports: null,
+				error: {
+					errorType: str65535,
+					message: "",
+					stack: "",
+					code: "",
+				},
+			}),
+		).not.toThrow();
+	});
+});
+
+// -- readLenPrefixedU16 position advance --
+
+describe("readLenPrefixedU16 position advance", () => {
+	it("round-trips ExecutionResult with multi-byte UTF-8 error strings", () => {
+		// Multi-byte UTF-8: each CJK char is 3 bytes in UTF-8 but 1 UTF-16 code unit in JS
+		const frame: BinaryFrame = {
+			type: "ExecutionResult",
+			sessionId: "s",
+			exitCode: 1,
+			exports: null,
+			error: {
+				errorType: "TypeError",
+				message: "变量未定义",
+				stack: "在文件第一行",
+				code: "ERR_UNDEFINED",
+			},
+		};
+		roundtrip(frame);
+	});
+
+	it("round-trips ExecutionResult with emoji in error fields", () => {
+		const frame: BinaryFrame = {
+			type: "ExecutionResult",
+			sessionId: "sess-emoji",
+			exitCode: 1,
+			exports: null,
+			error: {
+				errorType: "Error",
+				message: "Failed \u{1F4A5} boom",
+				stack: "at \u{1F4C4} file.js:1",
+				code: "",
+			},
+		};
+		roundtrip(frame);
+	});
+
+	it("round-trips ExecutionResult with all error fields containing multi-byte chars", () => {
+		const frame: BinaryFrame = {
+			type: "ExecutionResult",
+			sessionId: "t",
+			exitCode: 1,
+			exports: Buffer.from([0x01]),
+			error: {
+				errorType: "Ошибка",
+				message: "не найдено: файл.txt",
+				stack: "в строке 日本語テスト",
+				code: "ENOENT_テスト",
+			},
+		};
+		roundtrip(frame);
+	});
+});
+
+// -- fnv1aHash --
+
+describe("fnv1aHash", () => {
+	it("produces consistent hash for ASCII strings", () => {
+		expect(fnv1aHash("hello")).toBe(fnv1aHash("hello"));
+		expect(fnv1aHash("hello")).not.toBe(fnv1aHash("world"));
+	});
+
+	it("produces same hash as Rust FNV-1a over UTF-8 bytes for ASCII", () => {
+		// Pin published FNV-1a 32-bit values instead of re-deriving the expected
+		// hash with the same loop as the implementation: a re-derivation cannot
+		// catch a wrong offset basis or prime, and these literals are what any
+		// independent FNV-1a over the same bytes must also produce.
+		// Empty input returns the offset basis unchanged.
+		expect(fnv1aHash("")).toBe(0x811c9dc5);
+		// Single byte 0x61.
+		expect(fnv1aHash("a")).toBe(0xe40c292c);
+		// Classic reference vector.
+		expect(fnv1aHash("foobar")).toBe(0xbf9cf968);
+		// UTF-8 bytes [0x68, 0x65, 0x6c, 0x6c, 0x6f].
+		expect(fnv1aHash("hello")).toBe(0x4f9f2cab);
+	});
+
+	it("hashes over UTF-8 bytes for non-ASCII strings", () => {
+		// "é" is 2 bytes in UTF-8 (0xc3 0xa9) but 1 code unit in UTF-16
+		// If we hashed over UTF-16, we'd get a different result than UTF-8
+		const bytes = Buffer.from("café", "utf8");
+		let expected = 0x811c9dc5;
+		for (let i = 0; i < bytes.length; i++) {
+			expected ^= bytes[i];
+			expected = Math.imul(expected, 0x01000193);
+		}
+		expected = expected >>> 0;
+		expect(fnv1aHash("café")).toBe(expected);
+		// Verify it's 5 bytes, not 4 code units
+		expect(bytes.length).toBe(5);
+	});
+
+	it("produces different hash for non-ASCII vs naive charCodeAt approach", () => {
+		// Verify the fix matters: naive charCodeAt gives different result for non-ASCII
+		const str = "日本語";
+		const bytes = Buffer.from(str, "utf8");
+
+		// UTF-8 bytes hash (correct)
+		let utf8Hash = 0x811c9dc5;
+		for (let i = 0; i < bytes.length; i++) {
+			utf8Hash ^= bytes[i];
+			utf8Hash = Math.imul(utf8Hash, 0x01000193);
+		}
+		utf8Hash = utf8Hash >>> 0;
+
+		// UTF-16 code units hash (old buggy behavior)
+		let utf16Hash = 0x811c9dc5;
+		for (let i = 0; i < str.length; i++) {
+			utf16Hash ^= str.charCodeAt(i);
+			utf16Hash = Math.imul(utf16Hash, 0x01000193);
+		}
+		utf16Hash = utf16Hash >>> 0;
+
+		// They should differ for non-ASCII
+		expect(utf8Hash).not.toBe(utf16Hash);
+		// Our function should match the UTF-8 version
+		expect(fnv1aHash(str)).toBe(utf8Hash);
+	});
+});