/** * Internal methods for lattice-based ML-KEM and ML-DSA. * @module */ /*! noble-post-quantum - MIT License (c) 2024 Paul Miller (paulmillr.com) */ import { FFTCore, reverseBits } from '@noble/curves/abstract/fft.js'; import { shake128, shake256 } from '@noble/hashes/sha3.js'; import type { TypedArray } from '@noble/hashes/utils.js'; import { type BytesCoderLen, cleanBytes, type Coder, getMask, type TArg, type TRet, } from './utils.ts'; /** Extendable-output reader used by the CRYSTALS implementations. */ export type XOF = ( seed: Uint8Array, blockLen?: number ) => { /** * Read diagnostic counters for the current XOF session. * @returns Current call and XOF block counters. */ stats: () => { calls: number; xofs: number }; /** * Select one `(x, y)` coordinate pair and get a block reader for it. * Only one coordinate stream is live at a time: a later `get(...)` call rebinds the shared * SHAKE state and invalidates older readers. * Each squeeze aliases one mutable internal output buffer, so callers must copy blocks they * want to retain before the next read. * @param x - First matrix coordinate. * @param y - Second matrix coordinate. * @returns Lazy block reader for that coordinate pair. */ get: (x: number, y: number) => () => Uint8Array; // return block aligned to blockLen and 3 /** Wipe any buffered state once the reader is no longer needed. */ clean: () => void; }; /** CRYSTALS (ml-kem, ml-dsa) options */ /** Shared polynomial and NTT parameters for CRYSTALS algorithms. */ export type CrystalOpts = { /** * Allocate one zeroed polynomial/vector container. * @param n - Number of coefficients to allocate. * @returns Fresh typed container. */ newPoly: TypedCons; /** Polynomial size, typically `256`. */ N: number; /** Prime modulus used for all coefficient arithmetic. */ Q: number; /** Inverse transform normalization factor: * `256**-1 mod q` for Dilithium, `128**-1 mod q` for Kyber. */ F: number; /** Principal root of unity for the transform domain. */ ROOT_OF_UNITY: number; /** Number of bits used for bit-reversal ordering. */ brvBits: number; /** `true` for Kyber/ML-KEM mode, `false` for Dilithium/ML-DSA mode. */ isKyber: boolean; }; /** Constructor function for typed polynomial containers. */ export type TypedCons = (n: number) => T; type Crystals = { mod: (a: number, modulo?: number) => number; smod: (a: number, modulo?: number) => number; nttZetas: T; NTT: { /** Forward transform in place. Mutates and returns `r`. */ encode: (r: T) => T; /** Inverse transform in place. Mutates and returns `r`. */ decode: (r: T) => T; }; bitsCoder: (d: number, c: Coder) => BytesCoderLen; }; /** * Creates shared modular arithmetic, NTT, and packing helpers for CRYSTALS schemes. * @param opts - Polynomial and transform parameters. See {@link CrystalOpts}. * @returns CRYSTALS arithmetic and encoding helpers. * @example * Create shared modular arithmetic and NTT helpers for a CRYSTALS parameter set. * ```ts * const crystals = genCrystals({ * newPoly: (n) => new Uint16Array(n), * N: 256, * Q: 3329, * F: 3303, * ROOT_OF_UNITY: 17, * brvBits: 7, * isKyber: true, * }); * const reduced = crystals.mod(-1); * ``` */ export const genCrystals = (opts: CrystalOpts): TRet> => { // isKyber: true means Kyber, false means Dilithium const { newPoly, N, Q, F, ROOT_OF_UNITY, brvBits, isKyber } = opts; // Normalize JS `%` into the canonical Z_m representative `[0, modulo-1]` expected by // FIPS 203 §2.3 / FIPS 204 §2.3 before downstream mod-q arithmetic. const mod = (a: number, modulo = Q): number => { const result = a % modulo | 0; return (result >= 0 ? result | 0 : (modulo + result) | 0) | 0; }; // FIPS 204 §7.4 uses the centered `mod ±` representative for low bits, keeping the // positive midpoint when `modulo` is even. // Center to `[-floor((modulo-1)/2), floor(modulo/2)]`. const smod = (a: number, modulo = Q): number => { const r = mod(a, modulo) | 0; return (r > modulo >> 1 ? (r - modulo) | 0 : r) | 0; }; // Kyber uses the FIPS 203 Appendix A `BitRev_7` table here via the first 128 entries, while // Dilithium uses the FIPS 204 §7.5 / Appendix B `BitRev_8` zetas table over all 256 entries. function getZettas() { const out = newPoly(N); for (let i = 0; i < N; i++) { const b = reverseBits(i, brvBits); const p = BigInt(ROOT_OF_UNITY) ** BigInt(b) % BigInt(Q); out[i] = Number(p) | 0; } return out; } const nttZetas = getZettas(); // Number-Theoretic Transform // Explained: https://electricdusk.com/ntt.html // Kyber has slightly different params, since there is no 512th primitive root of unity mod q, // only 256th primitive root of unity mod. Which also complicates MultiplyNTT. const field = { add: (a: number, b: number) => mod((a | 0) + (b | 0)) | 0, sub: (a: number, b: number) => mod((a | 0) - (b | 0)) | 0, mul: (a: number, b: number) => mod((a | 0) * (b | 0)) | 0, inv: (_a: number) => { throw new Error('not implemented'); }, }; const nttOpts = { N, roots: nttZetas as any, invertButterflies: true, skipStages: isKyber ? 1 : 0, brp: false, }; const dif = FFTCore(field, { dit: false, ...nttOpts }); const dit = FFTCore(field, { dit: true, ...nttOpts }); const NTT = { encode: (r: T): T => { return dif(r) as any; }, decode: (r: T): T => { dit(r as any); // The inverse-NTT normalization factor is family-specific: FIPS 203 Algorithm 10 line 14 // uses `128^-1 mod q` for Kyber, while FIPS 204 Algorithm 42 lines 21-23 use `256^-1 mod q`. // kyber uses 128 here, because brv && stuff for (let i = 0; i < r.length; i++) r[i] = mod(F * r[i]); return r; }, }; // Pack one little-endian `d`-bit word per coefficient, matching FIPS 203 ByteEncode / // ByteDecode and the FIPS 204 BitsToBytes-based polynomial packing helpers. const bitsCoder = (d: number, c: Coder): TRet> => { const mask = getMask(d); const bytesLen = d * (N / 8); return { bytesLen, encode: (poly_: TArg): TRet => { const poly = poly_ as T; const r = new Uint8Array(bytesLen); for (let i = 0, buf = 0, bufLen = 0, pos = 0; i < poly.length; i++) { buf |= (c.encode(poly[i]) & mask) << bufLen; bufLen += d; for (; bufLen >= 8; bufLen -= 8, buf >>= 8) r[pos++] = buf & getMask(bufLen); } return r as TRet; }, decode: (bytes: TArg): TRet => { const r = newPoly(N); for (let i = 0, buf = 0, bufLen = 0, pos = 0; i < bytes.length; i++) { buf |= bytes[i] << bufLen; bufLen += 8; for (; bufLen >= d; bufLen -= d, buf >>= d) r[pos++] = c.decode(buf & mask); } return r as TRet; }, } as TRet>; }; return { mod, smod, nttZetas: nttZetas as TRet, NTT: { encode: (r: TArg): TRet => NTT.encode(r as T) as TRet, decode: (r: TArg): TRet => NTT.decode(r as T) as TRet, }, bitsCoder: bitsCoder as TRet>['bitsCoder'], }; }; const createXofShake = (shake: typeof shake128): TRet => (seed: TArg, blockLen?: number) => { if (!blockLen) blockLen = shake.blockLen; // Optimizations that won't mater: // - cached seed update (two .update(), on start and on the end) // - another cache which cloned into working copy // Faster than multiple updates, since seed less than blockLen const _seed = new Uint8Array(seed.length + 2); _seed.set(seed); const seedLen = seed.length; const buf = new Uint8Array(blockLen); // == shake128.blockLen let h = shake.create({}); let calls = 0; let xofs = 0; return { stats: () => ({ calls, xofs }), get: (x: number, y: number) => { // Rebind to `seed || x || y` so callers can implement the spec's per-coordinate // SHAKE inputs like `rho || j || i` and `rho || IntegerToBytes(counter, 2)`. _seed[seedLen + 0] = x; _seed[seedLen + 1] = y; h.destroy(); h = shake.create({}).update(_seed); calls++; return () => { xofs++; return h.xofInto(buf) as TRet; }; }, clean: () => { h.destroy(); cleanBytes(buf, _seed); }, }; }; /** * SHAKE128-based extendable-output reader factory used by ML-KEM. * `get(x, y)` selects one coordinate pair at a time; calling it again invalidates previously * returned readers, and each squeeze reuses one mutable internal output buffer. * @param seed - Seed bytes for the reader. * @param blockLen - Optional output block length. * @returns Stateful XOF reader. * @example * Build the ML-KEM SHAKE128 matrix expander and read one block. * ```ts * import { randomBytes } from '@noble/post-quantum/utils.js'; * import { XOF128 } from '@noble/post-quantum/_crystals.js'; * const reader = XOF128(randomBytes(32)); * const block = reader.get(0, 0)(); * ``` */ export const XOF128: TRet = /* @__PURE__ */ createXofShake(shake128); /** * SHAKE256-based extendable-output reader factory used by ML-DSA. * `get(x, y)` appends raw one-byte coordinates to the seed, invalidates previously returned * readers, and reuses one mutable internal output buffer for each squeeze. * @param seed - Seed bytes for the reader. * @param blockLen - Optional output block length. * @returns Stateful XOF reader. * @example * Build the ML-DSA SHAKE256 coefficient expander and read one block. * ```ts * import { randomBytes } from '@noble/post-quantum/utils.js'; * import { XOF256 } from '@noble/post-quantum/_crystals.js'; * const reader = XOF256(randomBytes(32)); * const block = reader.get(0, 0)(); * ``` */ export const XOF256: TRet = /* @__PURE__ */ createXofShake(shake256);