Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,10 @@ __pycache__/

# C extensions
*.so
*.pyd

# Cython generated
ethereum/pow/ethash_cy.c

# qkchash binaries
qkchash/qkchash
Expand Down
5 changes: 4 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -71,9 +71,12 @@ To install the required modules for the project. Under `pyquarkchain` dir where
# you may want to set the following if cryptography complains about header files: (https://github.com/pyca/cryptography/issues/3489)
# export CPPFLAGS=-I/usr/local/opt/openssl/include
# export LDFLAGS=-L/usr/local/opt/openssl/lib
pip install -e .
pip install -r requirements.txt
python setup.py build_ext --inplace
```

The second command builds the optional Cython extension (`ethash_cy`) that speeds up ethash `calc_dataset_item` by ~20x. It requires a C compiler. If the build is skipped, the pure-Python fallback is used automatically.

Once all the modules are installed, try running all the unit tests under `pyquarkchain`

```
Expand Down
180 changes: 121 additions & 59 deletions ethereum/pow/ethash.py
Original file line number Diff line number Diff line change
@@ -1,94 +1,156 @@
import copy
import os
import numpy as np
from functools import lru_cache
from typing import Callable, Dict, List

from ethereum.pow.ethash_utils import *
from ethereum.pow.ethash_utils import (
ethash_sha3_512, ethash_sha3_256,
FNV_PRIME, HASH_BYTES, WORD_BYTES, MIX_BYTES,
DATASET_PARENTS, CACHE_ROUNDS, ACCESSES, EPOCH_LENGTH,
)

# FNV multiply/xor arithmetic relies on uint32 wraparound; silence numpy's
# overflow warnings module-wide so the hot loops stay quiet.
np.seterr(over="ignore")

_FNV_PRIME = np.uint32(FNV_PRIME)

# Prefer the compiled Cython kernel for calc_dataset_item's parent-mixing
# loop; gracefully fall back to the pure-numpy path when the extension was
# never built (e.g. a source checkout without a C compiler).
try:
    from ethereum.pow.ethash_cy import mix_parents as _cy_mix_parents
except ImportError:  # pragma: no cover
    _cy_mix_parents = None

# Per-epoch seed hashes; index k holds the seed for epoch k. Extended
# lazily by mkcache().
cache_seeds = [b"\x00" * 32]  # type: List[bytes]


def mkcache(cache_size: int, block_number) -> List[List[int]]:

# ---------------------------------------------------------------------------
# ETHASH_LIB picks the implementation used for non-test PoW verification:
#   "ethash"    — pure-Python + numpy (always available)
#   "ethash_cy" — Cython + C keccak (requires `python setup.py build_ext`)
# The default "auto" probes for the compiled extension and falls back to the
# numpy implementation when it is absent.
# ---------------------------------------------------------------------------
ETHASH_LIB = os.environ.get("ETHASH_LIB", "auto")

if ETHASH_LIB == "auto":
    try:
        from ethereum.pow.ethash_cy import cy_hashimoto_light  # noqa: F401
        ETHASH_LIB = "ethash_cy"
    except ImportError:
        ETHASH_LIB = "ethash"

if ETHASH_LIB == "ethash":

    @lru_cache(2)
    def _get_cache(seed: bytes, n: int) -> np.ndarray:
        """Returns cache as uint32 ndarray of shape (n, 16)."""
        rows = np.empty((n, 16), dtype=np.uint32)
        # Sequential fill: row k is the 512-bit hash of row k-1.
        rows[0] = ethash_sha3_512(seed)
        for k in range(1, n):
            rows[k] = ethash_sha3_512(rows[k - 1])
        # Low-round randmemohash mixing passes.
        for _ in range(CACHE_ROUNDS):
            for k in range(n):
                pick = int(rows[k, 0]) % n
                mixed = rows[(k - 1 + n) % n] ^ rows[pick]
                rows[k] = ethash_sha3_512(mixed)
        return rows

    def hashimoto_light(
        full_size: int, cache: np.ndarray, header: bytes, nonce: bytes
    ) -> Dict:
        """Light verification: derive each needed dataset row from the cache."""
        def lookup(idx):
            return calc_dataset_item(cache, idx)

        return hashimoto(header, nonce, full_size, lookup)

elif ETHASH_LIB == "ethash_cy":
    from ethereum.pow.ethash_cy import cy_hashimoto_light, cy_mkcache

    @lru_cache(2)
    def _get_cache(seed: bytes, n: int):
        """Build the cache in the Cython extension (same (n, 16) layout)."""
        seed_u8 = np.frombuffer(seed, dtype=np.uint8)
        return cy_mkcache(seed_u8, n)

    def hashimoto_light(
        full_size: int, cache: np.ndarray, header: bytes, nonce: bytes
    ) -> Dict:
        """Light verification entirely inside the Cython extension."""
        header_u8 = np.frombuffer(header, dtype=np.uint8)
        nonce_u8 = np.frombuffer(nonce, dtype=np.uint8)
        return cy_hashimoto_light(full_size, cache, header_u8, nonce_u8)

else:
    raise ValueError(f"Unknown ETHASH_LIB={ETHASH_LIB!r}. "
                     f"Use 'ethash', 'ethash_cy', or 'auto'.")


def mkcache(cache_size: int, block_number) -> np.ndarray:
    """Return the ethash light cache for *block_number*'s epoch.

    Extends the per-epoch seed chain as needed, then delegates to the
    lru_cache-backed ``_get_cache`` so repeated calls within the same
    epoch reuse the already-built cache.
    """
    # Seed chain: seed[k] = sha3_256(seed[k-1]); seed[0] is 32 zero bytes.
    # ethash_sha3_256 returns an ndarray here, hence .tobytes().
    while len(cache_seeds) <= block_number // EPOCH_LENGTH:
        new_seed = ethash_sha3_256(cache_seeds[-1]).tobytes()
        cache_seeds.append(new_seed)

    seed = cache_seeds[block_number // EPOCH_LENGTH]
    return _get_cache(seed, cache_size // HASH_BYTES)


@lru_cache(10)
def _get_cache(seed, n) -> List[List[int]]:
    """Build the ethash light cache as *n* rows of hash words.

    NOTE(review): this pure-list implementation appears superseded by the
    numpy/Cython variants selected via ETHASH_LIB — confirm which
    definition is intended to win before shipping.
    """
    # Sequential fill: each row is the 512-bit hash of the previous one.
    rows = [ethash_sha3_512(seed)]
    for _ in range(1, n):
        rows.append(ethash_sha3_512(rows[-1]))

    # Low-round randmemohash: rehash each row mixed with a pseudo-random
    # partner row, CACHE_ROUNDS times over.
    for _ in range(CACHE_ROUNDS):
        for idx in range(n):
            partner = rows[idx][0] % n
            mixed = list(map(xor, rows[(idx - 1 + n) % n], rows[partner]))
            rows[idx] = ethash_sha3_512(mixed)

    return rows


def calc_dataset_item(cache: np.ndarray, i: int) -> np.ndarray:
    """Compute full-dataset row *i* from the light *cache*.

    cache rows and the returned row are uint32[16] ndarrays.
    """
    n = len(cache)
    # Initialize the mix from a cache row, perturbed by the item index.
    mix = cache[i % n].copy()
    mix[0] ^= i  # numpy wraps to uint32; no explicit np.uint32() boxing needed
    mix = ethash_sha3_512(mix)
    # FNV-fold DATASET_PARENTS pseudo-randomly chosen cache rows into the mix.
    if _cy_mix_parents is not None:
        # mix is a fresh C-contiguous uint32[16] from ethash_sha3_512, and
        # cache rows are likewise contiguous, so the Cython kernel can work
        # on the raw buffers directly.
        _cy_mix_parents(mix, cache, i)
    else:
        r = HASH_BYTES // WORD_BYTES  # 16 words per hash
        for j in range(DATASET_PARENTS):
            # fnv(i ^ j, mix[j % r]) computed with Python ints, masked to uint32.
            cache_index = ((i ^ j) * FNV_PRIME ^ int(mix[j % r])) & 0xFFFFFFFF
            mix *= _FNV_PRIME  # in-place: no temp array allocation
            mix ^= cache[cache_index % n]  # in-place: no temp array allocation
    return ethash_sha3_512(mix)


def calc_dataset(full_size, cache: np.ndarray) -> np.ndarray:
    """Materialize the full ethash dataset.

    Returns a (full_size // HASH_BYTES, 16) uint32 ndarray, one row per
    dataset item, each derived from the light *cache*.
    """
    rows = full_size // HASH_BYTES
    out = np.empty((rows, 16), dtype=np.uint32)  # pre-allocate; rows filled in order
    for i in range(rows):
        out[i] = calc_dataset_item(cache, i)
    return out


def hashimoto(
    header: bytes,
    nonce: bytes,
    full_size: int,
    dataset_lookup: Callable[[int], np.ndarray],
) -> Dict:
    """Core ethash mixing loop shared by light and full verification.

    Returns a dict with b"mix digest" (compressed mix bytes) and
    b"result" (sha3_256 of seed || compressed mix bytes).
    """
    n = full_size // HASH_BYTES
    w = MIX_BYTES // WORD_BYTES          # words per mix
    mixhashes = MIX_BYTES // HASH_BYTES  # hashes per mix

    # Combine header+nonce into a 64-byte seed (nonce reversed to little-endian).
    s = ethash_sha3_512(header + nonce[::-1])  # (16,) uint32
    mix = np.tile(s, mixhashes)                # (w,) uint32
    s0 = int(s[0])  # hoist constant, avoid repeated unboxing
    newdata = np.empty(w, dtype=np.uint32)  # pre-allocated, reused every iteration

    for i in range(ACCESSES):
        # p = fnv(i ^ s[0], mix[i % w]) % (n // mixhashes) * mixhashes,
        # computed with Python ints and masked back to uint32.
        p = ((i ^ s0) * FNV_PRIME ^ int(mix[i % w])) & 0xFFFFFFFF
        p = p % (n // mixhashes) * mixhashes
        for j in range(mixhashes):  # fill in place: avoids np.concatenate alloc+copy
            newdata[j * 16:(j + 1) * 16] = dataset_lookup(p + j)
        mix *= _FNV_PRIME  # in-place FNV multiply: no temp array
        mix ^= newdata     # in-place FNV xor: no temp array

    # Compress the mix: fnv-fold each group of 4 words down to 1.
    mix_r = mix.reshape(-1, 4)
    cmix = mix_r[:, 0] * _FNV_PRIME ^ mix_r[:, 1]
    cmix = cmix * _FNV_PRIME ^ mix_r[:, 2]
    cmix = cmix * _FNV_PRIME ^ mix_r[:, 3]

    s_cmix = np.concatenate([s, cmix])
    return {
        b"mix digest": cmix.tobytes(),
        b"result": ethash_sha3_256(s_cmix).tobytes(),
    }


def hashimoto_light(
    full_size: int, cache: List[List[int]], header: bytes, nonce: bytes
) -> Dict:
    """Run hashimoto using only the light cache, deriving dataset rows on demand.

    NOTE(review): the ETHASH_LIB branches above also define hashimoto_light —
    confirm which definition is intended to be final.
    """
    def lookup(idx):
        return calc_dataset_item(cache, idx)

    return hashimoto(header, nonce, full_size, lookup)


def hashimoto_full(dataset: np.ndarray, header: bytes, nonce: bytes) -> Dict:
    """Run hashimoto against a fully materialized dataset (lookup is a row index)."""
    full_size = len(dataset) * HASH_BYTES
    return hashimoto(header, nonce, full_size, lambda idx: dataset[idx])
Loading
Loading