p3_field/field.rs
1use alloc::vec;
2use alloc::vec::Vec;
3use core::fmt::{Debug, Display};
4use core::hash::Hash;
5use core::iter::{Product, Sum};
6use core::ops::{Add, AddAssign, Div, DivAssign, Mul, MulAssign, Neg, Sub, SubAssign};
7use core::{array, slice};
8
9use num_bigint::BigUint;
10use p3_maybe_rayon::prelude::*;
11use p3_util::{flatten_to_base, iter_array_chunks_padded};
12use serde::Serialize;
13use serde::de::DeserializeOwned;
14
15use crate::exponentiation::bits_u64;
16use crate::integers::{QuotientMap, from_integer_types};
17use crate::packed::PackedField;
18use crate::{Packable, PackedFieldExtension, PackedValue};
19
20/// A commutative ring, `R`, with prime characteristic, `p`.
21///
22/// This permits elements like:
23/// - A single finite field element.
24/// - A symbolic expression which would evaluate to a field element.
25/// - An array of finite field elements.
26/// - A polynomial with coefficients in a finite field.
27///
28/// ### Mathematical Description
29///
30/// Mathematically, a commutative ring is a set of objects which supports an addition-like
31/// like operation, `+`, and a multiplication-like operation `*`.
32///
33/// Let `x, y, z` denote arbitrary elements of the set.
34///
35/// Then, an operation is addition-like if it satisfies the following properties:
36/// - Commutativity => `x + y = y + x`
37/// - Associativity => `x + (y + z) = (x + y) + z`
38/// - Unit => There exists an identity element `ZERO` satisfying `x + ZERO = x`.
39/// - Inverses => For every `x` there exists a unique inverse `(-x)` satisfying `x + (-x) = ZERO`
40///
41/// Similarly, an operation is multiplication-like if it satisfies the following properties:
42/// - Commutativity => `x * y = y * x`
43/// - Associativity => `x * (y * z) = (x * y) * z`
44/// - Unit => There exists an identity element `ONE` satisfying `x * ONE = x`.
45/// - Distributivity => The two operations `+` and `*` must together satisfy `x * (y + z) = (x * y) + (x * z)`
46///
47/// Unlike in the addition case, we do not require inverses to exist with respect to `*`.
48///
49/// The simplest examples of commutative rings are the integers (`ℤ`), and the integers mod `N` (`ℤ/N`).
50///
51/// The characteristic of a ring is the smallest positive integer `r` such that `0 = r . 1 = 1 + 1 + ... + 1 (r times)`.
52/// For example, the characteristic of the modulo ring `ℤ/N` is `N`.
53///
54/// Rings with prime characteristic are particularly special due to their close relationship with finite fields.
55pub trait PrimeCharacteristicRing:
56 Sized
57 + Default
58 + Clone
59 + Add<Output = Self>
60 + AddAssign
61 + Sub<Output = Self>
62 + SubAssign
63 + Neg<Output = Self>
64 + Mul<Output = Self>
65 + MulAssign
66 + Sum
67 + Product
68 + Debug
69{
70 /// The field `ℤ/p` where the characteristic of this ring is p.
71 type PrimeSubfield: PrimeField;
72
73 /// The additive identity of the ring.
74 ///
75 /// For every element `a` in the ring we require the following properties:
76 ///
77 /// `a + ZERO = ZERO + a = a,`
78 ///
79 /// `a + (-a) = (-a) + a = ZERO.`
80 const ZERO: Self;
81
82 /// The multiplicative identity of the ring.
83 ///
84 /// For every element `a` in the ring we require the following property:
85 ///
86 /// `a*ONE = ONE*a = a.`
87 const ONE: Self;
88
89 /// The element in the ring given by `ONE + ONE`.
90 ///
91 /// This is provided as a convenience as `TWO` occurs regularly in
92 /// the proving system. This also is slightly faster than computing
93 /// it via addition. Note that multiplication by `TWO` is discouraged.
94 /// Instead of `a * TWO` use `a.double()` which will be faster.
95 ///
96 /// If the field has characteristic 2 this is equal to ZERO.
97 const TWO: Self;
98
99 /// The element in the ring given by `-ONE`.
100 ///
101 /// This is provided as a convenience as `NEG_ONE` occurs regularly in
102 /// the proving system. This also is slightly faster than computing
103 /// it via negation. Note that where possible `NEG_ONE` should be absorbed
104 /// into mathematical operations. For example `a - b` will be faster
105 /// than `a + NEG_ONE * b` and similarly `(-b)` is faster than `NEG_ONE * b`.
106 ///
107 /// If the field has characteristic 2 this is equal to ONE.
108 const NEG_ONE: Self;
109
110 /// Embed an element of the prime field `ℤ/p` into the ring `R`.
111 ///
112 /// Given any element `[r] ∈ ℤ/p`, represented by an integer `r` between `0` and `p - 1`
113 /// `from_prime_subfield([r])` will be equal to:
114 ///
115 /// `Self::ONE + ... + Self::ONE (r times)`
116 #[must_use]
117 fn from_prime_subfield(f: Self::PrimeSubfield) -> Self;
118
119 /// Return `Self::ONE` if `b` is `true` and `Self::ZERO` if `b` is `false`.
120 #[must_use]
121 #[inline(always)]
122 fn from_bool(b: bool) -> Self {
123 // Some rings might reimplement this to avoid the branch.
124 if b { Self::ONE } else { Self::ZERO }
125 }
126
127 from_integer_types!(
128 u8, u16, u32, u64, u128, usize, i8, i16, i32, i64, i128, isize
129 );
130
131 /// The elementary function `double(a) = 2*a`.
132 ///
133 /// This function should be preferred over calling `a + a` or `TWO * a` as a faster implementation may be available for some rings.
134 /// If the field has characteristic 2 then this returns 0.
135 #[must_use]
136 #[inline(always)]
137 fn double(&self) -> Self {
138 self.clone() + self.clone()
139 }
140
141 /// The elementary function `halve(a) = a/2`.
142 ///
143 /// # Panics
144 /// The function will panic if the field has characteristic 2.
145 #[must_use]
146 #[inline]
147 fn halve(&self) -> Self {
148 // This must be overwritten by PrimeField implementations as this definition
149 // is circular when PrimeSubfield = Self. It should also be overwritten by
150 // most rings to avoid the multiplication.
151 let half = Self::from_prime_subfield(Self::PrimeSubfield::ONE.halve());
152 self.clone() * half
153 }
154
155 /// The elementary function `square(a) = a^2`.
156 ///
157 /// This function should be preferred over calling `a * a`, as a faster implementation may be available for some rings.
158 #[must_use]
159 #[inline(always)]
160 fn square(&self) -> Self {
161 self.clone() * self.clone()
162 }
163
164 /// The elementary function `cube(a) = a^3`.
165 ///
166 /// This function should be preferred over calling `a * a * a`, as a faster implementation may be available for some rings.
167 #[must_use]
168 #[inline(always)]
169 fn cube(&self) -> Self {
170 self.square() * self.clone()
171 }
172
173 /// Computes the arithmetic generalization of boolean `xor`.
174 ///
175 /// For boolean inputs, `x ^ y = x + y - 2 xy`.
176 #[must_use]
177 #[inline(always)]
178 fn xor(&self, y: &Self) -> Self {
179 self.clone() + y.clone() - self.clone() * y.clone().double()
180 }
181
182 /// Computes the arithmetic generalization of a triple `xor`.
183 ///
184 /// For boolean inputs `x ^ y ^ z = x + y + z - 2(xy + xz + yz) + 4xyz`.
185 #[must_use]
186 #[inline(always)]
187 fn xor3(&self, y: &Self, z: &Self) -> Self {
188 self.xor(y).xor(z)
189 }
190
191 /// Computes the arithmetic generalization of `andnot`.
192 ///
193 /// For boolean inputs `(!x) & y = (1 - x)y`.
194 #[must_use]
195 #[inline(always)]
196 fn andn(&self, y: &Self) -> Self {
197 (Self::ONE - self.clone()) * y.clone()
198 }
199
200 /// The vanishing polynomial for boolean values: `x * (x - 1)`.
201 ///
202 /// This is a polynomial of degree `2` that evaluates to `0` if the input is `0` or `1`.
203 /// If our space is a field, then this will be nonzero on all other inputs.
204 #[must_use]
205 #[inline(always)]
206 fn bool_check(&self) -> Self {
207 // Note: We could delegate to `andn`, but to maintain backwards
208 // compatible AIR definitions, we stick with `x * (x - 1)` here.
209 self.clone() * (self.clone() - Self::ONE)
210 }
211
212 /// Exponentiation by a `u64` power.
213 ///
214 /// This uses the standard square and multiply approach.
215 /// For specific powers regularly used and known in advance,
216 /// this will be slower than custom addition chain exponentiation.
217 #[must_use]
218 #[inline]
219 fn exp_u64(&self, power: u64) -> Self {
220 let mut current = self.clone();
221 let mut product = Self::ONE;
222
223 for j in 0..bits_u64(power) {
224 if (power >> j) & 1 != 0 {
225 product *= current.clone();
226 }
227 current = current.square();
228 }
229 product
230 }
231
232 /// Exponentiation by a small constant power.
233 ///
234 /// For a collection of small values we implement custom multiplication chain circuits which can be faster than the
235 /// simpler square and multiply approach.
236 ///
237 /// For large values this defaults back to `self.exp_u64`.
238 #[must_use]
239 #[inline(always)]
240 fn exp_const_u64<const POWER: u64>(&self) -> Self {
241 match POWER {
242 0 => Self::ONE,
243 1 => self.clone(),
244 2 => self.square(),
245 3 => self.cube(),
246 4 => self.square().square(),
247 5 => self.square().square() * self.clone(),
248 6 => self.square().cube(),
249 7 => {
250 let x2 = self.square();
251 let x3 = x2.clone() * self.clone();
252 let x4 = x2.square();
253 x3 * x4
254 }
255 _ => self.exp_u64(POWER),
256 }
257 }
258
259 /// The elementary function `exp_power_of_2(a, power_log) = a^{2^power_log}`.
260 ///
261 /// Computed via repeated squaring.
262 #[must_use]
263 #[inline]
264 fn exp_power_of_2(&self, power_log: usize) -> Self {
265 let mut res = self.clone();
266 for _ in 0..power_log {
267 res = res.square();
268 }
269 res
270 }
271
272 /// The elementary function `mul_2exp_u64(a, exp) = a * 2^{exp}`.
273 ///
274 /// Here `2^{exp}` is computed using the square and multiply approach.
275 #[must_use]
276 #[inline]
277 fn mul_2exp_u64(&self, exp: u64) -> Self {
278 // Some rings might want to reimplement this to avoid the
279 // exponentiations (and potentially even the multiplication).
280 self.clone() * Self::TWO.exp_u64(exp)
281 }
282
283 /// Divide by a given power of two. `div_2exp_u64(a, exp) = a/2^exp`
284 ///
285 /// # Panics
286 /// The function will panic if the field has characteristic 2.
287 #[must_use]
288 #[inline]
289 fn div_2exp_u64(&self, exp: u64) -> Self {
290 // Some rings might want to reimplement this to avoid the
291 // exponentiations (and potentially even the multiplication).
292 self.clone() * Self::from_prime_subfield(Self::PrimeSubfield::ONE.halve().exp_u64(exp))
293 }
294
295 /// Construct an iterator which returns powers of `self`: `self^0, self^1, self^2, ...`.
296 #[must_use]
297 #[inline]
298 fn powers(&self) -> Powers<Self> {
299 self.shifted_powers(Self::ONE)
300 }
301
302 /// Construct an iterator which returns powers of `self` shifted by `start`: `start, start*self^1, start*self^2, ...`.
303 #[must_use]
304 #[inline]
305 fn shifted_powers(&self, start: Self) -> Powers<Self> {
306 Powers {
307 base: self.clone(),
308 current: start,
309 }
310 }
311
312 /// Compute the dot product of two vectors.
313 #[must_use]
314 #[inline]
315 fn dot_product<const N: usize>(u: &[Self; N], v: &[Self; N]) -> Self {
316 u.iter().zip(v).map(|(x, y)| x.clone() * y.clone()).sum()
317 }
318
319 /// Compute the sum of a slice of elements whose length is a compile time constant.
320 ///
321 /// The rust compiler doesn't realize that add is associative
322 /// so we help it out and minimize the dependency chains by hand.
323 /// Thus while this function has the same throughput as `input.iter().sum()`,
324 /// it will usually have much lower latency.
325 ///
326 /// # Panics
327 ///
328 /// May panic if the length of the input slice is not equal to `N`.
329 #[must_use]
330 #[inline]
331 fn sum_array<const N: usize>(input: &[Self]) -> Self {
332 // It looks a little strange but using a const parameter and an assert_eq! instead of
333 // using input.len() leads to a significant performance improvement.
334 // We could make this input &[Self; N] but that would require sticking .try_into().unwrap() everywhere.
335 // Checking godbolt, the compiler seems to unroll everything anyway.
336 assert_eq!(N, input.len());
337
338 // For `N <= 8` we implement a tree sum structure and for `N > 8` we break the input into
339 // chunks of `8`, perform a tree sum on each chunk and sum the results. The parameter `8`
340 // was determined experimentally by testing the speed of the poseidon2 internal layer computations.
341 // This is a useful benchmark as we have a mix of summations of size 15, 23 with other work in between.
342 // I only tested this on `AVX2` though so there might be a better value for other architectures.
343 match N {
344 0 => Self::ZERO,
345 1 => input[0].clone(),
346 2 => input[0].clone() + input[1].clone(),
347 3 => input[0].clone() + input[1].clone() + input[2].clone(),
348 4 => (input[0].clone() + input[1].clone()) + (input[2].clone() + input[3].clone()),
349 5 => Self::sum_array::<4>(&input[..4]) + Self::sum_array::<1>(&input[4..]),
350 6 => Self::sum_array::<4>(&input[..4]) + Self::sum_array::<2>(&input[4..]),
351 7 => Self::sum_array::<4>(&input[..4]) + Self::sum_array::<3>(&input[4..]),
352 8 => Self::sum_array::<4>(&input[..4]) + Self::sum_array::<4>(&input[4..]),
353 _ => {
354 // We know that N > 8 here so this saves an add over the usual
355 // initialisation of acc to Self::ZERO.
356 let mut acc = Self::sum_array::<8>(&input[..8]);
357 for i in (16..=N).step_by(8) {
358 acc += Self::sum_array::<8>(&input[(i - 8)..i]);
359 }
360 // This would be much cleaner if we could use const generic expressions but
361 // this will do for now.
362 match N & 7 {
363 0 => acc,
364 1 => acc + Self::sum_array::<1>(&input[(8 * (N / 8))..]),
365 2 => acc + Self::sum_array::<2>(&input[(8 * (N / 8))..]),
366 3 => acc + Self::sum_array::<3>(&input[(8 * (N / 8))..]),
367 4 => acc + Self::sum_array::<4>(&input[(8 * (N / 8))..]),
368 5 => acc + Self::sum_array::<5>(&input[(8 * (N / 8))..]),
369 6 => acc + Self::sum_array::<6>(&input[(8 * (N / 8))..]),
370 7 => acc + Self::sum_array::<7>(&input[(8 * (N / 8))..]),
371 _ => unreachable!(),
372 }
373 }
374 }
375 }
376
377 /// Allocates a vector of zero elements of length `len`. Many operating systems zero pages
378 /// before assigning them to a userspace process. In that case, our process should not need to
379 /// write zeros, which would be redundant. However, the compiler may not always recognize this.
380 ///
381 /// In particular, `vec![Self::ZERO; len]` appears to result in redundant userspace zeroing.
382 /// This is the default implementation, but implementers may wish to provide their own
383 /// implementation which transmutes something like `vec![0u32; len]`.
384 #[must_use]
385 #[inline]
386 fn zero_vec(len: usize) -> Vec<Self> {
387 vec![Self::ZERO; len]
388 }
389}
390
391/// A vector space `V` over `F` with a fixed basis. Fixing the basis allows elements of `V` to be
392/// converted to and from `DIMENSION` many elements of `F` which are interpreted as basis coefficients.
393///
394/// We usually expect `F` to be a field but do not enforce this and so allow it to be just a ring.
395/// This lets every ring implement `BasedVectorSpace<Self>` and is useful in a couple of other cases.
396///
397/// ## Safety
398/// We make no guarantees about consistency of the choice of basis across different versions of Plonky3.
399/// If this choice of basis changes, the behaviour of `BasedVectorSpace` will also change. Due to this,
400/// we recommend avoiding using this trait unless absolutely necessary.
401///
402/// ### Mathematical Description
403/// Given a vector space, `A` over `F`, a basis is a set of elements `B = {b_0, ..., b_{n-1}}`
404/// in `A` such that, given any element `a`, we can find a unique set of `n` elements of `F`,
405/// `f_0, ..., f_{n - 1}` satisfying `a = f_0 b_0 + ... + f_{n - 1} b_{n - 1}`. Thus the choice
406/// of `B` gives rise to a natural linear map between the vector space `A` and the canonical
407/// `n` dimensional vector space `F^n`.
408///
409/// This allows us to map between elements of `A` and arrays of `n` elements of `F`.
410/// Clearly this map depends entirely on the choice of basis `B` which may change
411/// across versions of Plonky3.
412///
413/// The situation is slightly more complicated in cases where `F` is not a field but boils down
414/// to an identical description once we enforce that `A` is a free module over `F`.
415pub trait BasedVectorSpace<F: PrimeCharacteristicRing>: Sized {
416 /// The dimension of the vector space, i.e. the number of elements in
417 /// its basis.
418 const DIMENSION: usize;
419
420 /// Fixes a basis for the algebra `A` and uses this to
421 /// map an element of `A` to a slice of `DIMENSION` `F` elements.
422 ///
423 /// # Safety
424 ///
425 /// The value produced by this function fundamentally depends
426 /// on the choice of basis. Care must be taken
427 /// to ensure portability if these values might ever be passed to
428 /// (or rederived within) another compilation environment where a
429 /// different basis might have been used.
430 #[must_use]
431 fn as_basis_coefficients_slice(&self) -> &[F];
432
433 /// Fixes a basis for the algebra `A` and uses this to
434 /// map `DIMENSION` `F` elements to an element of `A`.
435 ///
436 /// # Safety
437 ///
438 /// The value produced by this function fundamentally depends
439 /// on the choice of basis. Care must be taken
440 /// to ensure portability if these values might ever be passed to
441 /// (or rederived within) another compilation environment where a
442 /// different basis might have been used.
443 ///
444 /// Returns `None` if the length of the slice is different to `DIMENSION`.
445 #[must_use]
446 #[inline]
447 fn from_basis_coefficients_slice(slice: &[F]) -> Option<Self> {
448 Self::from_basis_coefficients_iter(slice.iter().cloned())
449 }
450
451 /// Fixes a basis for the algebra `A` and uses this to
452 /// map `DIMENSION` `F` elements to an element of `A`. Similar
453 /// to `core:array::from_fn`, the `DIMENSION` `F` elements are
454 /// given by `Fn(0), ..., Fn(DIMENSION - 1)` called in that order.
455 ///
456 /// # Safety
457 ///
458 /// The value produced by this function fundamentally depends
459 /// on the choice of basis. Care must be taken
460 /// to ensure portability if these values might ever be passed to
461 /// (or rederived within) another compilation environment where a
462 /// different basis might have been used.
463 #[must_use]
464 fn from_basis_coefficients_fn<Fn: FnMut(usize) -> F>(f: Fn) -> Self;
465
466 /// Fixes a basis for the algebra `A` and uses this to
467 /// map `DIMENSION` `F` elements to an element of `A`.
468 ///
469 /// # Safety
470 ///
471 /// The value produced by this function fundamentally depends
472 /// on the choice of basis. Care must be taken
473 /// to ensure portability if these values might ever be passed to
474 /// (or rederived within) another compilation environment where a
475 /// different basis might have been used.
476 ///
477 /// Returns `None` if the length of the iterator is different to `DIMENSION`.
478 #[must_use]
479 fn from_basis_coefficients_iter<I: ExactSizeIterator<Item = F>>(iter: I) -> Option<Self>;
480
481 /// Given a basis for the Algebra `A`, return the i'th basis element.
482 ///
483 /// # Safety
484 ///
485 /// The value produced by this function fundamentally depends
486 /// on the choice of basis. Care must be taken
487 /// to ensure portability if these values might ever be passed to
488 /// (or rederived within) another compilation environment where a
489 /// different basis might have been used.
490 ///
491 /// Returns `None` if `i` is greater than or equal to `DIMENSION`.
492 #[must_use]
493 #[inline]
494 fn ith_basis_element(i: usize) -> Option<Self> {
495 (i < Self::DIMENSION).then(|| Self::from_basis_coefficients_fn(|j| F::from_bool(i == j)))
496 }
497
498 /// Convert from a vector of `Self` to a vector of `F` by flattening the basis coefficients.
499 ///
500 /// Depending on the `BasedVectorSpace` this may be essentially a no-op and should certainly
501 /// be reimplemented in those cases.
502 ///
503 /// # Safety
504 ///
505 /// The value produced by this function fundamentally depends
506 /// on the choice of basis. Care must be taken
507 /// to ensure portability if these values might ever be passed to
508 /// (or rederived within) another compilation environment where a
509 /// different basis might have been used.
510 #[must_use]
511 #[inline]
512 fn flatten_to_base(vec: Vec<Self>) -> Vec<F> {
513 vec.into_iter()
514 .flat_map(|x| x.as_basis_coefficients_slice().to_vec())
515 .collect()
516 }
517
518 /// Convert from a vector of `F` to a vector of `Self` by combining the basis coefficients.
519 ///
520 /// Depending on the `BasedVectorSpace` this may be essentially a no-op and should certainly
521 /// be reimplemented in those cases.
522 ///
523 /// # Panics
524 /// This will panic if the length of `vec` is not a multiple of `Self::DIMENSION`.
525 ///
526 /// # Safety
527 ///
528 /// The value produced by this function fundamentally depends
529 /// on the choice of basis. Care must be taken
530 /// to ensure portability if these values might ever be passed to
531 /// (or rederived within) another compilation environment where a
532 /// different basis might have been used.
533 #[must_use]
534 #[inline]
535 fn reconstitute_from_base(vec: Vec<F>) -> Vec<Self>
536 where
537 F: Sync,
538 Self: Send,
539 {
540 assert_eq!(vec.len() % Self::DIMENSION, 0);
541
542 vec.par_chunks_exact(Self::DIMENSION)
543 .map(|chunk| {
544 Self::from_basis_coefficients_slice(chunk)
545 .expect("Chunk length not equal to dimension")
546 })
547 .collect()
548 }
549}
550
551/// Values that can act as sponge lanes for delimiter padding.
552///
553/// This is used by symmetric sponge adapters that need canonical `0` and `1` symbols while
554/// supporting both field/ring-based lanes and `u64`-based Keccak lanes behind one API.
555pub trait SpongePaddingValue: Copy {
556 /// The empty-lane value.
557 const PAD_ZERO: Self;
558
559 /// The delimiter value injected after the final absorbed element.
560 const PAD_ONE: Self;
561}
562
563impl<T: PrimeCharacteristicRing + Copy> SpongePaddingValue for T {
564 const PAD_ZERO: Self = Self::ZERO;
565 const PAD_ONE: Self = Self::ONE;
566}
567
568impl SpongePaddingValue for u64 {
569 const PAD_ZERO: Self = 0;
570 const PAD_ONE: Self = 1;
571}
572
573impl<const N: usize> SpongePaddingValue for [u64; N] {
574 const PAD_ZERO: Self = [0; N];
575 const PAD_ONE: Self = [1; N];
576}
577
578impl<F: PrimeCharacteristicRing> BasedVectorSpace<F> for F {
579 const DIMENSION: usize = 1;
580
581 #[inline]
582 fn as_basis_coefficients_slice(&self) -> &[F] {
583 slice::from_ref(self)
584 }
585
586 #[inline]
587 fn from_basis_coefficients_fn<Fn: FnMut(usize) -> F>(mut f: Fn) -> Self {
588 f(0)
589 }
590
591 #[inline]
592 fn from_basis_coefficients_iter<I: ExactSizeIterator<Item = F>>(mut iter: I) -> Option<Self> {
593 (iter.len() == 1).then(|| iter.next().unwrap()) // Unwrap will not panic as we know the length is 1.
594 }
595
596 #[inline]
597 fn flatten_to_base(vec: Vec<Self>) -> Vec<F> {
598 vec
599 }
600
601 #[inline]
602 fn reconstitute_from_base(vec: Vec<F>) -> Vec<Self> {
603 vec
604 }
605}
606
607/// A ring implements `InjectiveMonomial<N>` if the algebraic function
608/// `f(x) = x^N` is an injective map on elements of the ring.
609///
610/// We do not enforce that this map be invertible as there are useful
611/// cases such as polynomials or symbolic expressions where no inverse exists.
612///
613/// However, if the ring is a field with order `q` or an array of such field elements,
614/// then `f(x) = x^N` will be injective if and only if it is invertible and so in
615/// such cases this monomial acts as a permutation. Moreover, this will occur
616/// exactly when `N` and `q - 1` are relatively prime i.e. `gcd(N, q - 1) = 1`.
617pub trait InjectiveMonomial<const N: u64>: PrimeCharacteristicRing {
618 /// Compute `x -> x^n` for a given `n > 1` such that this
619 /// map is injective.
620 #[must_use]
621 #[inline]
622 fn injective_exp_n(&self) -> Self {
623 self.exp_const_u64::<N>()
624 }
625}
626
627/// A ring implements `PermutationMonomial<N>` if the algebraic function
628/// `f(x) = x^N` is invertible and thus acts as a permutation on elements of the ring.
629///
630/// In all cases we care about, this means that we can find another integer `K` such
631/// that `x = x^{NK}` for all elements of our ring.
632pub trait PermutationMonomial<const N: u64>: InjectiveMonomial<N> {
633 /// Compute `x -> x^K` for a given `K > 1` such that
634 /// `x^{NK} = x` for all elements `x`.
635 #[must_use]
636 fn injective_exp_root_n(&self) -> Self;
637}
638
639/// A ring `R` implements `Algebra<F>` if there is an injective homomorphism
640/// from `F` into `R`; in particular only `F::ZERO` maps to `R::ZERO`.
641///
642/// For the most part, we will usually expect `F` to be a field but there
643/// are a few cases where it is handy to allow it to just be a ring. In
644/// particular, every ring naturally implements `Algebra<Self>`.
645///
646/// ### Mathematical Description
647///
648/// Let `x` and `y` denote arbitrary elements of `F`. Then
649/// we require that our map `from` has the properties:
650/// - Preserves Identity: `from(F::ONE) = R::ONE`
651/// - Commutes with Addition: `from(x + y) = from(x) + from(y)`
652/// - Commutes with Multiplication: `from(x * y) = from(x) * from(y)`
653///
654/// Such maps are known as ring homomorphisms and are injective if the
655/// only element which maps to `R::ZERO` is `F::ZERO`.
656///
657/// The existence of this map makes `R` into an `F`-module and hence an `F`-algebra.
658/// If, additionally, `R` is a field, then this makes `R` a field extension of `F`.
659pub trait Algebra<F>:
660 PrimeCharacteristicRing
661 + From<F>
662 + Add<F, Output = Self>
663 + AddAssign<F>
664 + Sub<F, Output = Self>
665 + SubAssign<F>
666 + Mul<F, Output = Self>
667 + MulAssign<F>
668{
669}
670
671// Every ring is an algebra over itself.
672impl<R: PrimeCharacteristicRing> Algebra<R> for R {}
673
674/// A collection of methods designed to help hash field elements.
675///
676/// Most fields will want to reimplement many/all of these methods as the default implementations
677/// are slow and involve converting to/from byte representations.
678pub trait RawDataSerializable: Sized {
679 /// The number of bytes which this field element occupies in memory.
680 /// Must be equal to the length of self.into_bytes().
681 const NUM_BYTES: usize;
682
683 /// Convert a field element into a collection of bytes.
684 #[must_use]
685 fn into_bytes(self) -> impl IntoIterator<Item = u8>;
686
687 /// Convert an iterator of field elements into an iterator of bytes.
688 #[must_use]
689 fn into_byte_stream(input: impl IntoIterator<Item = Self>) -> impl IntoIterator<Item = u8> {
690 input.into_iter().flat_map(|elem| elem.into_bytes())
691 }
692
693 /// Convert an iterator of field elements into an iterator of u32s.
694 ///
695 /// If `NUM_BYTES` does not divide `4`, multiple `F`s may be packed together to make a single `u32`. Furthermore,
696 /// if `NUM_BYTES * input.len()` does not divide `4`, the final `u32` will involve padding bytes which are set to `0`.
697 #[must_use]
698 fn into_u32_stream(input: impl IntoIterator<Item = Self>) -> impl IntoIterator<Item = u32> {
699 let bytes = Self::into_byte_stream(input);
700 iter_array_chunks_padded(bytes, 0).map(u32::from_le_bytes)
701 }
702
703 /// Convert an iterator of field elements into an iterator of u64s.
704 ///
705 /// If `NUM_BYTES` does not divide `8`, multiple `F`s may be packed together to make a single `u64`. Furthermore,
706 /// if `NUM_BYTES * input.len()` does not divide `8`, the final `u64` will involve padding bytes which are set to `0`.
707 #[must_use]
708 fn into_u64_stream(input: impl IntoIterator<Item = Self>) -> impl IntoIterator<Item = u64> {
709 let bytes = Self::into_byte_stream(input);
710 iter_array_chunks_padded(bytes, 0).map(u64::from_le_bytes)
711 }
712
713 /// Convert an iterator of field element arrays into an iterator of byte arrays.
714 ///
715 /// Converts an element `[F; N]` into the byte array `[[u8; N]; NUM_BYTES]`. This is
716 /// intended for use with vectorized hash functions which use vector operations
717 /// to compute several hashes in parallel.
718 #[must_use]
719 fn into_parallel_byte_streams<const N: usize>(
720 input: impl IntoIterator<Item = [Self; N]>,
721 ) -> impl IntoIterator<Item = [u8; N]> {
722 input.into_iter().flat_map(|vector| {
723 let bytes = vector.map(|elem| elem.into_bytes().into_iter().collect::<Vec<_>>());
724 (0..Self::NUM_BYTES).map(move |i| array::from_fn(|j| bytes[j][i]))
725 })
726 }
727
728 /// Convert an iterator of field element arrays into an iterator of u32 arrays.
729 ///
730 /// Converts an element `[F; N]` into the u32 array `[[u32; N]; NUM_BYTES/4]`. This is
731 /// intended for use with vectorized hash functions which use vector operations
732 /// to compute several hashes in parallel.
733 ///
734 /// This function is guaranteed to be equivalent to starting with `Iterator<[F; N]>` performing a transpose
735 /// operation to get `[Iterator<F>; N]`, calling `into_u32_stream` on each element to get `[Iterator<u32>; N]` and then
736 /// performing another transpose operation to get `Iterator<[u32; N]>`.
737 ///
738 /// If `NUM_BYTES` does not divide `4`, multiple `[F; N]`s may be packed together to make a single `[u32; N]`. Furthermore,
739 /// if `NUM_BYTES * input.len()` does not divide `4`, the final `[u32; N]` will involve padding bytes which are set to `0`.
740 #[must_use]
741 fn into_parallel_u32_streams<const N: usize>(
742 input: impl IntoIterator<Item = [Self; N]>,
743 ) -> impl IntoIterator<Item = [u32; N]> {
744 let bytes = Self::into_parallel_byte_streams(input);
745 iter_array_chunks_padded(bytes, [0; N]).map(|byte_array: [[u8; N]; 4]| {
746 array::from_fn(|i| u32::from_le_bytes(array::from_fn(|j| byte_array[j][i])))
747 })
748 }
749
750 /// Convert an iterator of field element arrays into an iterator of u64 arrays.
751 ///
752 /// Converts an element `[F; N]` into the u64 array `[[u64; N]; NUM_BYTES/8]`. This is
753 /// intended for use with vectorized hash functions which use vector operations
754 /// to compute several hashes in parallel.
755 ///
756 /// This function is guaranteed to be equivalent to starting with `Iterator<[F; N]>` performing a transpose
757 /// operation to get `[Iterator<F>; N]`, calling `into_u64_stream` on each element to get `[Iterator<u64>; N]` and then
758 /// performing another transpose operation to get `Iterator<[u64; N]>`.
759 ///
760 /// If `NUM_BYTES` does not divide `8`, multiple `[F; N]`s may be packed together to make a single `[u64; N]`. Furthermore,
761 /// if `NUM_BYTES * input.len()` does not divide `8`, the final `[u64; N]` will involve padding bytes which are set to `0`.
762 #[must_use]
763 fn into_parallel_u64_streams<const N: usize>(
764 input: impl IntoIterator<Item = [Self; N]>,
765 ) -> impl IntoIterator<Item = [u64; N]> {
766 let bytes = Self::into_parallel_byte_streams(input);
767 iter_array_chunks_padded(bytes, [0; N]).map(|byte_array: [[u8; N]; 8]| {
768 array::from_fn(|i| u64::from_le_bytes(array::from_fn(|j| byte_array[j][i])))
769 })
770 }
771}
772
773/// A field `F`. This permits both modular fields `ℤ/p` along with their field extensions.
774///
775/// A ring is a field if every element `x` has a unique multiplicative inverse `x^{-1}`
776/// which satisfies `x * x^{-1} = F::ONE`.
777pub trait Field:
778 Algebra<Self>
779 + RawDataSerializable
780 + Packable
781 + 'static
782 + Copy
783 + Div<Self, Output = Self>
784 + DivAssign
785 + Add<Self::Packing, Output = Self::Packing>
786 + Sub<Self::Packing, Output = Self::Packing>
787 + Mul<Self::Packing, Output = Self::Packing>
788 + Eq
789 + Hash
790 + Send
791 + Sync
792 + Display
793 + Serialize
794 + DeserializeOwned
795{
796 type Packing: PackedField<Scalar = Self>;
797
798 /// A generator of this field's multiplicative group.
799 const GENERATOR: Self;
800
801 /// Check if the given field element is equal to the unique additive identity (ZERO).
802 #[must_use]
803 #[inline]
804 fn is_zero(&self) -> bool {
805 *self == Self::ZERO
806 }
807
808 /// Check if the given field element is equal to the unique multiplicative identity (ONE).
809 #[must_use]
810 #[inline]
811 fn is_one(&self) -> bool {
812 *self == Self::ONE
813 }
814
815 /// The multiplicative inverse of this field element, if it exists.
816 ///
817 /// NOTE: The inverse of `0` is undefined and will return `None`.
818 #[must_use]
819 fn try_inverse(&self) -> Option<Self>;
820
821 /// The multiplicative inverse of this field element.
822 ///
823 /// # Panics
824 /// The function will panic if the field element is `0`.
825 /// Use try_inverse if you want to handle this case.
826 #[must_use]
827 fn inverse(&self) -> Self {
828 self.try_inverse().expect("Tried to invert zero")
829 }
830
831 /// Add two slices of field elements together, returning the result in the first slice.
832 ///
833 /// Makes use of packing to speed up the addition.
834 ///
835 /// This is optimal for cases where the two slices are small to medium length. E.g. between
836 /// `F::Packing::WIDTH` and roughly however many elements fit in a cache line.
837 ///
838 /// For larger slices, it's likely worthwhile to use parallelization before calling this.
839 /// Similarly if you need to add a large number of slices together, it's best to
840 /// break them into small chunks and call this on the smaller chunks.
841 ///
842 /// # Panics
843 /// The function will panic if the lengths of the two slices are not equal.
844 #[inline]
845 fn add_slices(slice_1: &mut [Self], slice_2: &[Self]) {
846 let (shorts_1, suffix_1) = Self::Packing::pack_slice_with_suffix_mut(slice_1);
847 let (shorts_2, suffix_2) = Self::Packing::pack_slice_with_suffix(slice_2);
848 debug_assert_eq!(shorts_1.len(), shorts_2.len());
849 debug_assert_eq!(suffix_1.len(), suffix_2.len());
850 for (x_1, &x_2) in shorts_1.iter_mut().zip(shorts_2) {
851 *x_1 += x_2;
852 }
853 for (x_1, &x_2) in suffix_1.iter_mut().zip(suffix_2) {
854 *x_1 += x_2;
855 }
856 }
857
858 /// The number of elements in the field.
859 ///
860 /// This will either be prime if the field is a PrimeField or a power of a
861 /// prime if the field is an extension field.
862 #[must_use]
863 fn order() -> BigUint;
864
865 /// The number of bits required to define an element of this field.
866 ///
867 /// Usually due to storage and practical reasons the memory size of
868 /// a field element will be a little larger than bits().
869 #[must_use]
870 #[inline]
871 fn bits() -> usize {
872 Self::order().bits() as usize
873 }
874}
875
876/// A field isomorphic to `ℤ/p` for some prime `p`.
877///
878/// There is a natural map from `ℤ` to `ℤ/p` which sends an integer `r` to its conjugacy class `[r]`.
879/// Canonically, each conjugacy class `[r]` can be represented by the unique integer `s` in `[0, p - 1)`
880/// satisfying `s = r mod p`. This however is often not the most convenient computational representation
881/// and so internal representations of field elements might differ from this and may change over time.
882pub trait PrimeField:
883 Field
884 + Ord
885 + QuotientMap<u8>
886 + QuotientMap<u16>
887 + QuotientMap<u32>
888 + QuotientMap<u64>
889 + QuotientMap<u128>
890 + QuotientMap<usize>
891 + QuotientMap<i8>
892 + QuotientMap<i16>
893 + QuotientMap<i32>
894 + QuotientMap<i64>
895 + QuotientMap<i128>
896 + QuotientMap<isize>
897{
898 /// Return the representative of `value` in canonical form
899 /// which lies in the range `0 <= x < self.order()`.
900 #[must_use]
901 fn as_canonical_biguint(&self) -> BigUint;
902}
903
904/// A prime field `ℤ/p` with order, `p < 2^64`.
905pub trait PrimeField64: PrimeField {
906 const ORDER_U64: u64;
907
908 /// Return the representative of `value` in canonical form
909 /// which lies in the range `0 <= x < ORDER_U64`.
910 #[must_use]
911 fn as_canonical_u64(&self) -> u64;
912
913 /// Convert a field element to a `u64` such that any two field elements
914 /// are converted to the same `u64` if and only if they represent the same value.
915 ///
916 /// This will be the fastest way to convert a field element to a `u64` and
917 /// is intended for use in hashing. It will also be consistent across different targets.
918 #[must_use]
919 #[inline(always)]
920 fn to_unique_u64(&self) -> u64 {
921 // A simple default which is optimal for some fields.
922 self.as_canonical_u64()
923 }
924}
925
926/// A prime field `ℤ/p` with order `p < 2^32`.
927pub trait PrimeField32: PrimeField64 {
928 const ORDER_U32: u32;
929
930 /// Return the representative of `value` in canonical form
931 /// which lies in the range `0 <= x < ORDER_U64`.
932 #[must_use]
933 fn as_canonical_u32(&self) -> u32;
934
935 /// Convert a field element to a `u32` such that any two field elements
936 /// are converted to the same `u32` if and only if they represent the same value.
937 ///
938 /// This will be the fastest way to convert a field element to a `u32` and
939 /// is intended for use in hashing. It will also be consistent across different targets.
940 #[must_use]
941 #[inline(always)]
942 fn to_unique_u32(&self) -> u32 {
943 // A simple default which is optimal for some fields.
944 self.as_canonical_u32()
945 }
946}
947
948/// A field `EF` which is also an algebra over a field `F`.
949///
950/// This provides a couple of convenience methods on top of the
951/// standard methods provided by `Field`, `Algebra<F>` and `BasedVectorSpace<F>`.
952///
953/// It also provides a type which handles packed vectors of extension field elements.
954pub trait ExtensionField<Base: Field>: Field + Algebra<Base> + BasedVectorSpace<Base> {
955 type ExtensionPacking: PackedFieldExtension<Base, Self> + 'static + Copy + Send + Sync;
956
957 /// Determine if the given element lies in the base field.
958 #[must_use]
959 fn is_in_basefield(&self) -> bool;
960
961 /// If the element lies in the base field project it down.
962 /// Otherwise return None.
963 #[must_use]
964 fn as_base(&self) -> Option<Base>;
965}
966
967// Every field is trivially a one dimensional extension over itself.
968impl<F: Field> ExtensionField<F> for F {
969 type ExtensionPacking = F::Packing;
970
971 #[inline]
972 fn is_in_basefield(&self) -> bool {
973 true
974 }
975
976 #[inline]
977 fn as_base(&self) -> Option<F> {
978 Some(*self)
979 }
980}
981
982/// A field which supplies information like the two-adicity of its multiplicative group, and methods
983/// for obtaining two-adic generators.
984pub trait TwoAdicField: Field {
985 /// The number of factors of two in this field's multiplicative group.
986 const TWO_ADICITY: usize;
987
988 /// Returns a generator of the multiplicative group of order `2^bits`.
989 /// Assumes `bits <= TWO_ADICITY`, otherwise the result is undefined.
990 #[must_use]
991 fn two_adic_generator(bits: usize) -> Self;
992}
993
994/// An iterator which returns the powers of a base element `b` shifted by current `c`: `c, c * b, c * b^2, ...`.
995#[derive(Clone, Debug)]
996pub struct Powers<R: PrimeCharacteristicRing> {
997 pub base: R,
998 pub current: R,
999}
1000
1001impl<R: PrimeCharacteristicRing> Iterator for Powers<R> {
1002 type Item = R;
1003
1004 fn next(&mut self) -> Option<R> {
1005 let result = self.current.clone();
1006 self.current *= self.base.clone();
1007 Some(result)
1008 }
1009}
1010
1011impl<R: PrimeCharacteristicRing> Powers<R> {
1012 /// Returns an iterator yielding the first `n` powers.
1013 #[inline]
1014 #[must_use]
1015 pub const fn take(self, n: usize) -> BoundedPowers<R> {
1016 BoundedPowers { iter: self, n }
1017 }
1018
1019 /// Fills `slice` with the next `slice.len()` powers yielded by the iterator.
1020 #[inline]
1021 pub fn fill(self, slice: &mut [R]) {
1022 slice
1023 .iter_mut()
1024 .zip(self)
1025 .for_each(|(out, next)| *out = next);
1026 }
1027
1028 /// Wrapper for `self.take(n).collect()`.
1029 #[inline]
1030 #[must_use]
1031 pub fn collect_n(self, n: usize) -> Vec<R> {
1032 self.take(n).collect()
1033 }
1034}
1035
1036impl<F: Field> BoundedPowers<F> {
1037 /// Collect exactly `num_powers` ascending powers of `self.base`, starting at `self.current`.
1038 ///
1039 /// # Details
1040 ///
1041 /// The computation is split evenly amongst available threads, and each chunk is computed
1042 /// using packed fields.
1043 ///
1044 /// # Performance
1045 ///
1046 /// Enable the `parallel` feature to enable parallelization.
1047 #[must_use]
1048 pub fn collect(self) -> Vec<F> {
1049 let num_powers = self.n;
1050
1051 // When num_powers is small, fallback to serial computation
1052 if num_powers < 16 {
1053 return self.take(num_powers).collect();
1054 }
1055
1056 // Allocate buffer storing packed powers, containing at least `num_powers` scalars.
1057 let width = F::Packing::WIDTH;
1058 let num_packed = num_powers.div_ceil(width);
1059 let mut points_packed = F::Packing::zero_vec(num_packed);
1060
1061 // Split computation evenly among threads
1062 let num_threads = current_num_threads().max(1);
1063 let chunk_size = num_packed.div_ceil(num_threads);
1064
1065 // Precompute base for each chunk.
1066 let base = self.iter.base;
1067 let chunk_base = base.exp_u64((chunk_size * width) as u64);
1068 let shift = self.iter.current;
1069
1070 points_packed
1071 .par_chunks_mut(chunk_size)
1072 .enumerate()
1073 .for_each(|(chunk_idx, chunk_slice)| {
1074 // First power in this chunk
1075 let chunk_start = shift * chunk_base.exp_u64(chunk_idx as u64);
1076
1077 // Fill the chunk with packed powers.
1078 F::Packing::packed_shifted_powers(base, chunk_start).fill(chunk_slice);
1079 });
1080
1081 // return the number of requested points, discarding the unused packed powers
1082 // SAFETY: size_of::<F::Packing> always divides size_of::<F::Packing>.
1083 let mut points = unsafe { flatten_to_base(points_packed) };
1084 points.truncate(num_powers);
1085 points
1086 }
1087}
1088
1089/// Same as [`Powers`], but returns a bounded number of powers.
1090#[derive(Clone, Debug)]
1091pub struct BoundedPowers<R: PrimeCharacteristicRing> {
1092 iter: Powers<R>,
1093 n: usize,
1094}
1095
1096impl<R: PrimeCharacteristicRing> Iterator for BoundedPowers<R> {
1097 type Item = R;
1098
1099 fn next(&mut self) -> Option<R> {
1100 (self.n != 0).then(|| {
1101 self.n -= 1;
1102 self.iter.next().unwrap()
1103 })
1104 }
1105}