Add allocation-free RistrettoPoint::double_and_compress_batch()

daxpedda · daxpedda · commit d2dec5d2be1f · 2025-08-14T00:49:34.000+02:00
diff --git a/curve25519-dalek/benches/dalek_benchmarks.rs b/curve25519-dalek/benches/dalek_benchmarks.rs
@@ -289,7 +289,7 @@ mod ristretto_benches {
                     let points: Vec<RistrettoPoint> = (0..size)
                         .map(|_| RistrettoPoint::try_from_rng(&mut rng).unwrap())
                         .collect();
-                    b.iter(|| RistrettoPoint::double_and_compress_batch(&points));
+                    b.iter(|| RistrettoPoint::double_and_compress_alloc_batch(&points));
                 },
             );
         }
diff --git a/curve25519-dalek/src/edwards.rs b/curve25519-dalek/src/edwards.rs
@@ -599,7 +599,7 @@ impl EdwardsPoint {
 
         // Compute the denominators in a batch
         let mut denominators = eds.iter().map(|p| &p.Z - &p.Y).collect::<Vec<_>>();
-        FieldElement::batch_invert(&mut denominators);
+        FieldElement::batch_alloc_invert(&mut denominators);
 
         // Now compute the Montgomery u coordinate for every point
         let mut ret = Vec::with_capacity(eds.len());
@@ -621,7 +621,7 @@ impl EdwardsPoint {
     #[cfg(feature = "alloc")]
     pub fn compress_batch(inputs: &[EdwardsPoint]) -> Vec<CompressedEdwardsY> {
         let mut zs = inputs.iter().map(|input| input.Z).collect::<Vec<_>>();
-        FieldElement::batch_invert(&mut zs);
+        FieldElement::batch_alloc_invert(&mut zs);
 
         inputs
             .iter()
diff --git a/curve25519-dalek/src/field.rs b/curve25519-dalek/src/field.rs
@@ -203,17 +203,32 @@ impl FieldElement {
         (t19, t3)
     }
 
+    /// Given an array of public `FieldElements`, replace each with its inverse.
+    ///
+    /// When an input `FieldElement` is zero, its value is unchanged.
+    pub(crate) fn batch_invert<const N: usize>(inputs: &mut [FieldElement; N]) {
+        let mut scratch = [FieldElement::ONE; N];
+
+        Self::internal_batch_invert(inputs, &mut scratch);
+    }
+
     /// Given a slice of pub(crate)lic `FieldElements`, replace each with its inverse.
     ///
     /// When an input `FieldElement` is zero, its value is unchanged.
     #[cfg(feature = "alloc")]
-    pub(crate) fn batch_invert(inputs: &mut [FieldElement]) {
+    pub(crate) fn batch_alloc_invert(inputs: &mut [FieldElement]) {
+        let n = inputs.len();
+        let mut scratch = vec![FieldElement::ONE; n];
+
+        Self::internal_batch_invert(inputs, &mut scratch);
+    }
+
+    fn internal_batch_invert(inputs: &mut [FieldElement], scratch: &mut [FieldElement]) {
         // Montgomery’s Trick and Fast Implementation of Masked AES
         // Genelle, Prouff and Quisquater
         // Section 3.2
 
-        let n = inputs.len();
-        let mut scratch = vec![FieldElement::ONE; n];
+        debug_assert_eq!(inputs.len(), scratch.len());
 
         // Keep an accumulator of all of the previous products
         let mut acc = FieldElement::ONE;
@@ -234,12 +249,12 @@ impl FieldElement {
 
         // Pass through the vector backwards to compute the inverses
         // in place
-        for (input, scratch) in inputs.iter_mut().rev().zip(scratch.into_iter().rev()) {
+        for (input, scratch) in inputs.iter_mut().rev().zip(scratch.iter_mut().rev()) {
             let tmp = &acc * input;
             // input <- acc * scratch, then acc <- tmp
             // Again, we skip zeros in a constant-time way
             let nz = !input.is_zero();
-            input.conditional_assign(&(&acc * &scratch), nz);
+            input.conditional_assign(&(&acc * scratch), nz);
             acc.conditional_assign(&tmp, nz);
         }
     }
@@ -485,7 +500,7 @@ mod test {
         let a2 = &a + &a;
         let a_list = vec![a, ap58, asq, ainv, a0, a2];
         let mut ainv_list = a_list.clone();
-        FieldElement::batch_invert(&mut ainv_list[..]);
+        FieldElement::batch_alloc_invert(&mut ainv_list[..]);
         for i in 0..6 {
             assert_eq!(a_list[i].invert(), ainv_list[i]);
         }
diff --git a/curve25519-dalek/src/ristretto.rs b/curve25519-dalek/src/ristretto.rs
@@ -161,7 +161,7 @@
 #[cfg(feature = "alloc")]
 use alloc::vec::Vec;
 
-use core::array::TryFromSliceError;
+use core::array::{self, TryFromSliceError};
 use core::borrow::Borrow;
 use core::fmt::Debug;
 use core::iter::Sum;
@@ -532,6 +532,47 @@ impl RistrettoPoint {
         CompressedRistretto(s.to_bytes())
     }
 
+    /// Double-and-compress a fixed-size batch of points without allocating.
+    ///
+    /// The Ristretto encoding is not batchable, since it requires an inverse
+    /// square root.  However, given input points \\( P\_1, \ldots, P\_n, \\)
+    /// it is possible to compute the encodings of their doubles
+    /// \\( \mathrm{enc}( \[2\]P\_1), \ldots, \mathrm{enc}( \[2\]P\_n ) \\)
+    /// in a batch; element `i` of the result encodes the double of `points[i]`.
+    ///
+    #[cfg_attr(feature = "rand_core", doc = "```")]
+    #[cfg_attr(not(feature = "rand_core"), doc = "```ignore")]
+    /// # use curve25519_dalek::ristretto::RistrettoPoint;
+    /// use rand_core::{OsRng, TryRngCore};
+    ///
+    /// # // Need fn main() here in comment so the doctest compiles
+    /// # // See https://doc.rust-lang.org/book/documentation.html#documentation-as-tests
+    /// # fn main() {
+    /// let mut rng = OsRng.unwrap_err();
+    ///
+    /// let points: [RistrettoPoint; 32] =
+    ///     core::array::from_fn(|_| RistrettoPoint::random(&mut rng));
+    ///
+    /// let compressed = RistrettoPoint::double_and_compress_batch(&points);
+    ///
+    /// for (P, P2_compressed) in points.iter().zip(compressed.iter()) {
+    ///     assert_eq!(*P2_compressed, (P + P).compress());
+    /// }
+    /// # }
+    /// ```
+    pub fn double_and_compress_batch<const N: usize>(
+        points: &[RistrettoPoint; N],
+    ) -> [CompressedRistretto; N] {
+        let states: [BatchCompressState; N] =
+            array::from_fn(|i| BatchCompressState::from(&points[i]));
+
+        let mut invs: [FieldElement; N] = array::from_fn(|i| states[i].efgh());
+
+        FieldElement::batch_invert(&mut invs);
+
+        array::from_fn(|i| Self::internal_double_and_compress_batch(&states[i], &invs[i]))
+    }
+
     /// Double-and-compress a batch of points.  The Ristretto encoding
     /// is not batchable, since it requires an inverse square root.
     ///
@@ -553,97 +594,68 @@ impl RistrettoPoint {
     /// let points: Vec<RistrettoPoint> =
     ///     (0..32).map(|_| RistrettoPoint::random(&mut rng)).collect();
     ///
-    /// let compressed = RistrettoPoint::double_and_compress_batch(&points);
+    /// let compressed = RistrettoPoint::double_and_compress_alloc_batch(&points);
     ///
     /// for (P, P2_compressed) in points.iter().zip(compressed.iter()) {
     ///     assert_eq!(*P2_compressed, (P + P).compress());
     /// }
     /// # }
     /// ```
     #[cfg(feature = "alloc")]
-    pub fn double_and_compress_batch<'a, I>(points: I) -> Vec<CompressedRistretto>
+    pub fn double_and_compress_alloc_batch<'a, I>(points: I) -> Vec<CompressedRistretto>
     where
         I: IntoIterator<Item = &'a RistrettoPoint>,
     {
-        #[derive(Copy, Clone, Debug)]
-        struct BatchCompressState {
-            e: FieldElement,
-            f: FieldElement,
-            g: FieldElement,
-            h: FieldElement,
-            eg: FieldElement,
-            fh: FieldElement,
-        }
-
-        impl BatchCompressState {
-            fn efgh(&self) -> FieldElement {
-                &self.eg * &self.fh
-            }
-        }
-
-        impl<'a> From<&'a RistrettoPoint> for BatchCompressState {
-            #[rustfmt::skip] // keep alignment of explanatory comments
-            fn from(P: &'a RistrettoPoint) -> BatchCompressState {
-                let XX = P.0.X.square();
-                let YY = P.0.Y.square();
-                let ZZ = P.0.Z.square();
-                let dTT = &P.0.T.square() * &constants::EDWARDS_D;
-
-                let e = &P.0.X * &(&P.0.Y + &P.0.Y); // = 2*X*Y
-                let f = &ZZ + &dTT;                  // = Z^2 + d*T^2
-                let g = &YY + &XX;                   // = Y^2 - a*X^2
-                let h = &ZZ - &dTT;                  // = Z^2 - d*T^2
-
-                let eg = &e * &g;
-                let fh = &f * &h;
-
-                BatchCompressState{ e, f, g, h, eg, fh }
-            }
-        }
-
         let states: Vec<BatchCompressState> =
             points.into_iter().map(BatchCompressState::from).collect();
 
         let mut invs: Vec<FieldElement> = states.iter().map(|state| state.efgh()).collect();
 
-        FieldElement::batch_invert(&mut invs[..]);
+        FieldElement::batch_alloc_invert(&mut invs[..]);
 
         states
             .iter()
             .zip(invs.iter())
             .map(|(state, inv): (&BatchCompressState, &FieldElement)| {
-                let Zinv = &state.eg * inv;
-                let Tinv = &state.fh * inv;
+                Self::internal_double_and_compress_batch(state, inv)
+            })
+            .collect()
+    }
 
-                let mut magic = constants::INVSQRT_A_MINUS_D;
+    fn internal_double_and_compress_batch(
+        state: &BatchCompressState,
+        inv: &FieldElement,
+    ) -> CompressedRistretto {
+        let Zinv = &state.eg * inv;
+        let Tinv = &state.fh * inv;
 
-                let negcheck1 = (&state.eg * &Zinv).is_negative();
+        let mut magic = constants::INVSQRT_A_MINUS_D;
 
-                let mut e = state.e;
-                let mut g = state.g;
-                let mut h = state.h;
+        let negcheck1 = (&state.eg * &Zinv).is_negative();
 
-                let minus_e = -&e;
-                let f_times_sqrta = &state.f * &constants::SQRT_M1;
+        let mut e = state.e;
+        let mut g = state.g;
+        let mut h = state.h;
 
-                e.conditional_assign(&state.g, negcheck1);
-                g.conditional_assign(&minus_e, negcheck1);
-                h.conditional_assign(&f_times_sqrta, negcheck1);
+        let minus_e = -&e;
+        let f_times_sqrta = &state.f * &constants::SQRT_M1;
 
-                magic.conditional_assign(&constants::SQRT_M1, negcheck1);
+        e.conditional_assign(&state.g, negcheck1);
+        g.conditional_assign(&minus_e, negcheck1);
+        h.conditional_assign(&f_times_sqrta, negcheck1);
 
-                let negcheck2 = (&(&h * &e) * &Zinv).is_negative();
+        magic.conditional_assign(&constants::SQRT_M1, negcheck1);
 
-                g.conditional_negate(negcheck2);
+        let negcheck2 = (&(&h * &e) * &Zinv).is_negative();
 
-                let mut s = &(&h - &g) * &(&magic * &(&g * &Tinv));
+        g.conditional_negate(negcheck2);
 
-                let s_is_negative = s.is_negative();
-                s.conditional_negate(s_is_negative);
+        let mut s = &(&h - &g) * &(&magic * &(&g * &Tinv));
 
-                CompressedRistretto(s.to_bytes())
-            })
-            .collect()
+        let s_is_negative = s.is_negative();
+        s.conditional_negate(s_is_negative);
+
+        CompressedRistretto(s.to_bytes())
     }
 
     /// Return the coset self + E\[4\], for debugging.
@@ -1156,6 +1168,42 @@ impl RistrettoBasepointTable {
     }
 }
 
+#[derive(Copy, Clone, Debug)]
+struct BatchCompressState {
+    e: FieldElement, // = 2*X*Y
+    f: FieldElement, // = Z^2 + d*T^2
+    g: FieldElement, // = Y^2 - a*X^2
+    h: FieldElement, // = Z^2 - d*T^2
+    eg: FieldElement, // = e*g
+    fh: FieldElement, // = f*h
+}
+
+impl BatchCompressState {
+    fn efgh(&self) -> FieldElement {
+        &self.eg * &self.fh // = e*f*g*h, the per-point value handed to the batch inversion
+    }
+}
+
+impl<'a> From<&'a RistrettoPoint> for BatchCompressState {
+    #[rustfmt::skip] // keep alignment of explanatory comments
+    fn from(P: &'a RistrettoPoint) -> BatchCompressState {
+        let XX = P.0.X.square();
+        let YY = P.0.Y.square();
+        let ZZ = P.0.Z.square();
+        let dTT = &P.0.T.square() * &constants::EDWARDS_D;
+
+        let e = &P.0.X * &(&P.0.Y + &P.0.Y); // = 2*X*Y
+        let f = &ZZ + &dTT;                  // = Z^2 + d*T^2
+        let g = &YY + &XX;                   // = Y^2 - a*X^2
+        let h = &ZZ - &dTT;                  // = Z^2 - d*T^2
+
+        let eg = &e * &g;
+        let fh = &f * &h;
+
+        BatchCompressState{ e, f, g, h, eg, fh }
+    }
+}
+
 // ------------------------------------------------------------------------
 // Constant-time conditional selection
 // ------------------------------------------------------------------------
@@ -1860,7 +1908,7 @@ mod test {
             .collect();
         points[500] = <RistrettoPoint as Group>::identity();
 
-        let compressed = RistrettoPoint::double_and_compress_batch(&points);
+        let compressed = RistrettoPoint::double_and_compress_alloc_batch(&points);
 
         for (P, P2_compressed) in points.iter().zip(compressed.iter()) {
             assert_eq!(*P2_compressed, (P + P).compress());

Original file line number	Diff line number	Diff line change
`@@ -289,7 +289,7 @@ mod ristretto_benches {`
`289`	`289`	`let points: Vec<RistrettoPoint> = (0..size)`
`290`	`290`	`.map(\|_\| RistrettoPoint::try_from_rng(&mut rng).unwrap())`
`291`	`291`	`.collect();`
`292`		`- b.iter(\|\| RistrettoPoint::double_and_compress_batch(&points));`
	`292`	`+ b.iter(\|\| RistrettoPoint::double_and_compress_alloc_batch(&points));`
`293`	`293`	`},`
`294`	`294`	`);`
`295`	`295`	`}`