feat: use lodestar-bun hashtree (#8481)

wemeetagain · web-flow · commit fd1dac853d05 · 2025-09-30T17:29:30.000-04:00
**Motivation** - #7280 **Description** - bump lodestar-bun - leveldb uses snappy - leveldb macos build fix - use hashtree-bun hasher in bun
diff --git a/packages/cli/package.json b/packages/cli/package.json
@@ -9,7 +9,18 @@
   },
   "homepage": "https://github.com/ChainSafe/lodestar#readme",
   "type": "module",
-  "exports": "./lib/index.js",
+  "exports": {
+    ".": {
+      "bun": "./src/index.ts",
+      "import": "./lib/index.js"
+    }
+  },
+  "imports": {
+    "#hashtree-hasher": {
+      "bun": "./src/util/hasher_bun.ts",
+      "import": "./lib/util/hasher_nodejs.js"
+    }
+  },
   "files": [
     "src",
     "lib",
@@ -65,6 +76,7 @@
     "@libp2p/peer-id": "^5.1.0",
     "@lodestar/api": "^1.34.1",
     "@lodestar/beacon-node": "^1.34.1",
+    "@lodestar/bun": "git+https://github.com/ChainSafe/lodestar-bun.git",
     "@lodestar/config": "^1.34.1",
     "@lodestar/db": "^1.34.1",
     "@lodestar/light-client": "^1.34.1",
diff --git a/packages/cli/src/applyPreset.ts b/packages/cli/src/applyPreset.ts
@@ -1,6 +1,7 @@
 // MUST import this file first before anything and not import any Lodestar code.
+
+import {hasher as hashtreeHasher} from "#hashtree-hasher";
 import {setHasher} from "@chainsafe/persistent-merkle-tree";
-import {hasher as hashtreeHasher} from "@chainsafe/persistent-merkle-tree/hasher/hashtree";
 
 // Without setting this first, persistent-merkle-tree will use noble instead
 setHasher(hashtreeHasher);
diff --git a/packages/cli/src/util/hasher_bun.ts b/packages/cli/src/util/hasher_bun.ts
@@ -0,0 +1,133 @@
+import {byteArrayIntoHashObject} from "@chainsafe/as-sha256";
+import {
+  HashComputationLevel,
+  HashObject,
+  Hasher,
+  Node,
+  doDigestNLevel,
+  doMerkleizeBlockArray,
+  doMerkleizeBlocksBytes,
+} from "@chainsafe/persistent-merkle-tree";
+import {digest2Bytes32, digest2Bytes32Into, hashInto} from "@lodestar/bun";
+
+/**
+ * Best SIMD implementation is in 512 bits = 64 bytes
+ * If not, hashtree will make a loop inside
+ * Given sha256 operates on a block of 4 bytes, we can hash 16 inputs at once
+ * Each input is 64 bytes
+ */
+const PARALLEL_FACTOR = 16;
+const MAX_INPUT_SIZE = PARALLEL_FACTOR * 64;
+const uint8Input = new Uint8Array(MAX_INPUT_SIZE);
+const uint32Input = new Uint32Array(uint8Input.buffer);
+const uint8Output = new Uint8Array(PARALLEL_FACTOR * 32);
+// having this will cause more memory to extract uint32
+// const uint32Output = new Uint32Array(uint8Output.buffer);
+// convenient reusable Uint8Array for hash64
+const hash64Input = uint8Input.subarray(0, 64);
+const hash64Output = uint8Output.subarray(0, 32);
+// size input array to 2 HashObject per computation * 32 bytes per object
+const destNodes: Node[] = new Array<Node>(PARALLEL_FACTOR);
+
+export const hasher: Hasher = {
+  name: "hashtree-bun",
+  hashInto,
+  digest64(obj1: Uint8Array, obj2: Uint8Array): Uint8Array {
+    return digest2Bytes32(obj1, obj2);
+  },
+  digest64Into: (obj1: Uint8Array, obj2: Uint8Array, output: Uint8Array): void => {
+    digest2Bytes32Into(obj1, obj2, output);
+  },
+  digest64HashObjects(left: HashObject, right: HashObject, parent: HashObject): void {
+    hashObjectsToUint32Array(left, right, uint32Input);
+    hashInto(hash64Input, hash64Output);
+    byteArrayIntoHashObject(hash64Output, 0, parent);
+  },
+  merkleizeBlocksBytes(blocksBytes: Uint8Array, padFor: number, output: Uint8Array, offset: number): void {
+    doMerkleizeBlocksBytes(blocksBytes, padFor, output, offset, hashInto);
+  },
+  merkleizeBlockArray(blocks, blockLimit, padFor, output, offset) {
+    doMerkleizeBlockArray(blocks, blockLimit, padFor, output, offset, hashInto, uint8Input);
+  },
+  digestNLevel(data: Uint8Array, nLevel: number): Uint8Array {
+    return doDigestNLevel(data, nLevel, hashInto);
+  },
+  executeHashComputations(hashComputations: HashComputationLevel[]): void {
+    for (let level = hashComputations.length - 1; level >= 0; level--) {
+      const hcArr = hashComputations[level];
+      if (!hcArr) {
+        // should not happen
+        throw Error(`no hash computations for level ${level}`);
+      }
+
+      if (hcArr.length === 0) {
+        // nothing to hash
+        continue;
+      }
+
+      // hash every 16 inputs at once to avoid memory allocation
+      let i = 0;
+      for (const {src0, src1, dest} of hcArr) {
+        if (!src0 || !src1 || !dest) {
+          throw new Error(`Invalid HashComputation at index ${i}`);
+        }
+        const indexInBatch = i % PARALLEL_FACTOR;
+        const offset = indexInBatch * 16;
+
+        hashObjectToUint32Array(src0, uint32Input, offset);
+        hashObjectToUint32Array(src1, uint32Input, offset + 8);
+        destNodes[indexInBatch] = dest;
+        if (indexInBatch === PARALLEL_FACTOR - 1) {
+          hashInto(uint8Input, uint8Output);
+          for (const [j, destNode] of destNodes.entries()) {
+            byteArrayIntoHashObject(uint8Output, j * 32, destNode);
+          }
+        }
+        i++;
+      }
+
+      const remaining = hcArr.length % PARALLEL_FACTOR;
+      // we prepared data in input, now hash the remaining
+      if (remaining > 0) {
+        const remainingInput = uint8Input.subarray(0, remaining * 64);
+        const remainingOutput = uint8Output.subarray(0, remaining * 32);
+        hashInto(remainingInput, remainingOutput);
+        // destNodes was prepared above
+        for (let j = 0; j < remaining; j++) {
+          byteArrayIntoHashObject(remainingOutput, j * 32, destNodes[j]);
+        }
+      }
+    }
+  },
+};
+
+function hashObjectToUint32Array(obj: HashObject, arr: Uint32Array, offset: number): void {
+  arr[offset] = obj.h0;
+  arr[offset + 1] = obj.h1;
+  arr[offset + 2] = obj.h2;
+  arr[offset + 3] = obj.h3;
+  arr[offset + 4] = obj.h4;
+  arr[offset + 5] = obj.h5;
+  arr[offset + 6] = obj.h6;
+  arr[offset + 7] = obj.h7;
+}
+
+// note that uint32ArrayToHashObject will cause more memory
+function hashObjectsToUint32Array(obj1: HashObject, obj2: HashObject, arr: Uint32Array): void {
+  arr[0] = obj1.h0;
+  arr[1] = obj1.h1;
+  arr[2] = obj1.h2;
+  arr[3] = obj1.h3;
+  arr[4] = obj1.h4;
+  arr[5] = obj1.h5;
+  arr[6] = obj1.h6;
+  arr[7] = obj1.h7;
+  arr[8] = obj2.h0;
+  arr[9] = obj2.h1;
+  arr[10] = obj2.h2;
+  arr[11] = obj2.h3;
+  arr[12] = obj2.h4;
+  arr[13] = obj2.h5;
+  arr[14] = obj2.h6;
+  arr[15] = obj2.h7;
+}
diff --git a/packages/cli/src/util/hasher_nodejs.ts b/packages/cli/src/util/hasher_nodejs.ts
@@ -0,0 +1,3 @@
+import {hasher} from "@chainsafe/persistent-merkle-tree/hasher/hashtree";
+
+export {hasher};
diff --git a/packages/cli/tsconfig.build.json b/packages/cli/tsconfig.build.json
@@ -2,6 +2,7 @@
   "extends": "../../tsconfig.build.json",
   "include": ["src"],
   "compilerOptions": {
+    "rootDir": "src",
     "outDir": "lib"
   }
 }
diff --git a/packages/cli/tsconfig.json b/packages/cli/tsconfig.json
@@ -2,6 +2,7 @@
   "extends": "../../tsconfig.json",
   "include": ["src", "test"],
   "compilerOptions": {
+    "rootDir": "../..",
     "outDir": "lib"
   }
 }
diff --git a/yarn.lock b/yarn.lock
@@ -550,10 +550,10 @@
     "@chainsafe/blst-linux-x64-musl" "2.2.0"
     "@chainsafe/blst-win32-x64-msvc" "2.2.0"
 
-"@chainsafe/bun-ffi-z@^1.1.3":
-  version "1.1.3"
-  resolved "https://registry.yarnpkg.com/@chainsafe/bun-ffi-z/-/bun-ffi-z-1.1.3.tgz#152a06a9cde8e0050ac400703ec5c438fcbcd221"
-  integrity sha512-KlhcVDUYdcAI7KRy4UTQvxMtaFGpSodHizNy/1aHFaC+sjCKBoTTaVdQhbcVF1Jy3O12WK7ZzTlljpKgEvma+Q==
+"@chainsafe/bun-ffi-z@^1.1.4":
+  version "1.1.4"
+  resolved "https://registry.yarnpkg.com/@chainsafe/bun-ffi-z/-/bun-ffi-z-1.1.4.tgz#7f069f4c66771ca0850d675193be707dbc06922b"
+  integrity sha512-yegYWjcj9pMwrf554iuFGoUc+Kq8EWDrVpeGiPl/nmXu/lm5EaUzxsiLG6WR1J9tpTQk012213y9RA5PwDrUTQ==
 
 "@chainsafe/discv5@^11.0.4":
   version "11.0.4"
@@ -2140,9 +2140,9 @@
 
 "@lodestar/bun@git+https://github.com/ChainSafe/lodestar-bun.git":
   version "0.1.0"
-  resolved "git+https://github.com/ChainSafe/lodestar-bun.git#368dfa6e112171231d23edbc34e55ad53054442e"
+  resolved "git+https://github.com/ChainSafe/lodestar-bun.git#e1b7001df927619284c1a29320240c4834278777"
   dependencies:
-    "@chainsafe/bun-ffi-z" "^1.1.3"
+    "@chainsafe/bun-ffi-z" "^1.1.4"
 
 "@lukeed/ms@^2.0.2":
   version "2.0.2"

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+import {hasher} from "@chainsafe/persistent-merkle-tree/hasher/hashtree";`
	`2`	`+`
	`3`	`+export {hasher};`
Original file line number	Diff line number	Diff line change
`@@ -2,6 +2,7 @@`
`2`	`2`	`"extends": "../../tsconfig.build.json",`
`3`	`3`	`"include": ["src"],`
`4`	`4`	`"compilerOptions": {`
	`5`	`+ "rootDir": "src",`
`5`	`6`	`"outDir": "lib"`
`6`	`7`	`}`
`7`	`8`	`}`
Original file line number	Diff line number	Diff line change
`@@ -2,6 +2,7 @@`
`2`	`2`	`"extends": "../../tsconfig.json",`
`3`	`3`	`"include": ["src", "test"],`
`4`	`4`	`"compilerOptions": {`
	`5`	`+ "rootDir": "../..",`
`5`	`6`	`"outDir": "lib"`
`6`	`7`	`}`
`7`	`8`	`}`