From b1499a77f9366e8d0124c0bb4803952b776831c0 Mon Sep 17 00:00:00 2001
From: Alexander Evgin <aleasims@gmail.com>
Date: Wed, 18 Oct 2023 18:34:54 +0300
Subject: [PATCH] Revert "Clean up hash-to-field (#678)"

This reverts commit 9469e1b92d1df7cd6f08cfd6cb6455e8495abdf5.
---
 ec/src/hashing/map_to_curve_hasher.rs         |   2 +-
 ff/Cargo.toml                                 |   1 -
 ff/src/fields/field_hashers/expander/mod.rs   | 133 ++++++++----------
 ff/src/fields/field_hashers/expander/tests.rs |  11 +-
 ff/src/fields/field_hashers/mod.rs            |  64 ++++-----
 test-templates/src/h2c/mod.rs                 |   6 +-
 6 files changed, 91 insertions(+), 126 deletions(-)
diff --git a/ec/src/hashing/map_to_curve_hasher.rs b/ec/src/hashing/map_to_curve_hasher.rs
index e0f46f323..fa50a5e57 100644
--- a/ec/src/hashing/map_to_curve_hasher.rs
+++ b/ec/src/hashing/map_to_curve_hasher.rs
@@ -56,7 +56,7 @@ where
         // 5. P = clear_cofactor(R)
         // 6. return P
 
-        let rand_field_elems = self.field_hasher.hash_to_field::<2>(msg);
+        let rand_field_elems = self.field_hasher.hash_to_field(msg, 2);
 
         let rand_curve_elem_0 = M2C::map_to_curve(rand_field_elems[0])?;
         let rand_curve_elem_1 = M2C::map_to_curve(rand_field_elems[1])?;
diff --git a/ff/Cargo.toml b/ff/Cargo.toml
index bfbf07798..b201b086b 100644
--- a/ff/Cargo.toml
+++ b/ff/Cargo.toml
@@ -19,7 +19,6 @@ ark-ff-asm.workspace = true
 ark-ff-macros.workspace = true
 ark-std.workspace = true
 ark-serialize.workspace = true
-arrayvec = { version = "0.7", default-features = false }
 derivative = { workspace = true, features = ["use_core"] }
 num-traits.workspace = true
 paste.workspace = true
diff --git a/ff/src/fields/field_hashers/expander/mod.rs b/ff/src/fields/field_hashers/expander/mod.rs
index 16cc17df5..8b1ef0a12 100644
--- a/ff/src/fields/field_hashers/expander/mod.rs
+++ b/ff/src/fields/field_hashers/expander/mod.rs
@@ -1,119 +1,99 @@
 // The below implementation is a rework of https://github.com/armfazh/h2c-rust-ref
 // With some optimisations
 
-use core::marker::PhantomData;
-
 use ark_std::vec::Vec;
-
-use arrayvec::ArrayVec;
-use digest::{ExtendableOutput, FixedOutputReset, Update};
-
+use digest::{DynDigest, ExtendableOutput, Update};
 pub trait Expander {
+    fn construct_dst_prime(&self) -> Vec<u8>;
     fn expand(&self, msg: &[u8], length: usize) -> Vec<u8>;
 }
 const MAX_DST_LENGTH: usize = 255;
 
-const LONG_DST_PREFIX: &[u8; 17] = b"H2C-OVERSIZE-DST-";
-
-/// Implements section [5.3.3](https://datatracker.ietf.org/doc/html/draft-irtf-cfrg-hash-to-curve-16#section-5.3.3)
-/// "Using DSTs longer than 255 bytes" of the
-/// [IRTF CFRG hash-to-curve draft #16](https://datatracker.ietf.org/doc/html/draft-irtf-cfrg-hash-to-curve-16#section-5.3.3).
-pub struct DST(arrayvec::ArrayVec<u8, MAX_DST_LENGTH>);
-
-impl DST {
-    pub fn new_xmd<H: FixedOutputReset + Default>(dst: &[u8]) -> DST {
-        let array = if dst.len() > MAX_DST_LENGTH {
-            let mut long = H::default();
-            long.update(&LONG_DST_PREFIX[..]);
-            long.update(&dst);
-            ArrayVec::try_from(long.finalize_fixed().as_ref()).unwrap()
-        } else {
-            ArrayVec::try_from(dst).unwrap()
-        };
-        DST(array)
-    }
-
-    pub fn new_xof<H: ExtendableOutput + Default>(dst: &[u8], k: usize) -> DST {
-        let array = if dst.len() > MAX_DST_LENGTH {
-            let mut long = H::default();
-            long.update(&LONG_DST_PREFIX[..]);
-            long.update(&dst);
-
-            let mut new_dst = [0u8; MAX_DST_LENGTH];
-            let new_dst = &mut new_dst[0..((2 * k + 7) >> 3)];
-            long.finalize_xof_into(new_dst);
-            ArrayVec::try_from(&*new_dst).unwrap()
-        } else {
-            ArrayVec::try_from(dst).unwrap()
-        };
-        DST(array)
-    }
-
-    pub fn update<H: Update>(&self, h: &mut H) {
-        h.update(self.0.as_ref());
-        // I2OSP(len,1) https://www.rfc-editor.org/rfc/rfc8017.txt
-        h.update(&[self.0.len() as u8]);
-    }
-}
+const LONG_DST_PREFIX: [u8; 17] = [
+    // ASCII bytes of "H2C-OVERSIZE-DST-", hashed ahead of any DST longer than MAX_DST_LENGTH.
+    0x48, 0x32, 0x43, 0x2d, 0x4f, 0x56, 0x45, 0x52, 0x53, 0x49, 0x5a, 0x45, 0x2d, 0x44, 0x53, 0x54,
+    0x2d,
+];
 
-pub(super) struct ExpanderXof<H: ExtendableOutput + Clone + Default> {
-    pub(super) xofer: PhantomData<H>,
+pub(super) struct ExpanderXof<T: Update + Clone + ExtendableOutput> {
+    pub(super) xofer: T,
     pub(super) dst: Vec<u8>,
     pub(super) k: usize,
 }
 
-impl<H: ExtendableOutput + Clone + Default> Expander for ExpanderXof<H> {
+impl<T: Update + Clone + ExtendableOutput> Expander for ExpanderXof<T> {
+    fn construct_dst_prime(&self) -> Vec<u8> {
+        let mut dst_prime = if self.dst.len() > MAX_DST_LENGTH {
+            let mut xofer = self.xofer.clone();
+            xofer.update(&LONG_DST_PREFIX.clone());
+            xofer.update(&self.dst);
+            xofer.finalize_boxed((2 * self.k + 7) >> 3).to_vec()
+        } else {
+            self.dst.clone()
+        };
+        dst_prime.push(dst_prime.len() as u8);
+        dst_prime
+    }
     fn expand(&self, msg: &[u8], n: usize) -> Vec<u8> {
-        let mut xofer = H::default();
-        xofer.update(msg);
+        let dst_prime = self.construct_dst_prime();
+        let lib_str = &[((n >> 8) & 0xFF) as u8, (n & 0xFF) as u8];
 
-        // I2OSP(len,2) https://www.rfc-editor.org/rfc/rfc8017.txt
-        let lib_str = (n as u16).to_be_bytes();
-        xofer.update(&lib_str);
-
-        DST::new_xof::<H>(self.dst.as_ref(), self.k).update(&mut xofer);
-        xofer.finalize_boxed(n).into_vec()
+        let mut xofer = self.xofer.clone();
+        xofer.update(msg);
+        xofer.update(lib_str);
+        xofer.update(&dst_prime);
+        xofer.finalize_boxed(n).to_vec()
     }
 }
 
-pub(super) struct ExpanderXmd<H: FixedOutputReset + Default + Clone> {
-    pub(super) hasher: PhantomData<H>,
+pub(super) struct ExpanderXmd<T: DynDigest + Clone> {
+    pub(super) hasher: T,
     pub(super) dst: Vec<u8>,
     pub(super) block_size: usize,
 }
 
-static Z_PAD: [u8; 256] = [0u8; 256];
-
-impl<H: FixedOutputReset + Default + Clone> Expander for ExpanderXmd<H> {
+impl<T: DynDigest + Clone> Expander for ExpanderXmd<T> {
+    fn construct_dst_prime(&self) -> Vec<u8> {
+        let mut dst_prime = if self.dst.len() > MAX_DST_LENGTH {
+            let mut hasher = self.hasher.clone();
+            hasher.update(&LONG_DST_PREFIX);
+            hasher.update(&self.dst);
+            hasher.finalize_reset().to_vec()
+        } else {
+            self.dst.clone()
+        };
+        dst_prime.push(dst_prime.len() as u8);
+        dst_prime
+    }
     fn expand(&self, msg: &[u8], n: usize) -> Vec<u8> {
-        use digest::typenum::Unsigned;
+        let mut hasher = self.hasher.clone();
         // output size of the hash function, e.g. 32 bytes = 256 bits for sha2::Sha256
-        let b_len = H::OutputSize::to_usize();
+        let b_len = hasher.output_size();
         let ell = (n + (b_len - 1)) / b_len;
         assert!(
             ell <= 255,
             "The ratio of desired output to the output size of hash function is too large!"
         );
 
-        let dst_prime = DST::new_xmd::<H>(self.dst.as_ref());
+        let dst_prime = self.construct_dst_prime();
+        let z_pad: Vec<u8> = vec![0; self.block_size];
         // Represent `len_in_bytes` as a 2-byte array.
         // As per I2OSP method outlined in https://tools.ietf.org/pdf/rfc8017.pdf,
         // The program should abort if integer that we're trying to convert is too large.
         assert!(n < (1 << 16), "Length should be smaller than 2^16");
         let lib_str: [u8; 2] = (n as u16).to_be_bytes();
 
-        let mut hasher = H::default();
-        hasher.update(&Z_PAD[0..self.block_size]);
+        hasher.update(&z_pad);
         hasher.update(msg);
         hasher.update(&lib_str);
         hasher.update(&[0u8]);
-        dst_prime.update(&mut hasher);
-        let b0 = hasher.finalize_fixed_reset();
+        hasher.update(&dst_prime);
+        let b0 = hasher.finalize_reset();
 
         hasher.update(&b0);
         hasher.update(&[1u8]);
-        dst_prime.update(&mut hasher);
-        let mut bi = hasher.finalize_fixed_reset();
+        hasher.update(&dst_prime);
+        let mut bi = hasher.finalize_reset();
 
         let mut uniform_bytes: Vec<u8> = Vec::with_capacity(n);
         uniform_bytes.extend_from_slice(&bi);
@@ -123,12 +103,11 @@ impl<H: FixedOutputReset + Default + Clone> Expander for ExpanderXmd<H> {
                 hasher.update(&[*l ^ *r]);
             }
             hasher.update(&[i as u8]);
-            dst_prime.update(&mut hasher);
-            bi = hasher.finalize_fixed_reset();
+            hasher.update(&dst_prime);
+            bi = hasher.finalize_reset();
             uniform_bytes.extend_from_slice(&bi);
         }
-        uniform_bytes.truncate(n);
-        uniform_bytes
+        uniform_bytes[0..n].to_vec()
     }
 }
 
diff --git a/ff/src/fields/field_hashers/expander/tests.rs b/ff/src/fields/field_hashers/expander/tests.rs
index eeebc64a7..36b4190f9 100644
--- a/ff/src/fields/field_hashers/expander/tests.rs
+++ b/ff/src/fields/field_hashers/expander/tests.rs
@@ -5,7 +5,6 @@ use sha3::{Shake128, Shake256};
 use std::{
     fs::{read_dir, File},
     io::BufReader,
-    marker::PhantomData,
 };
 
 use super::{Expander, ExpanderXmd, ExpanderXof};
@@ -100,29 +99,29 @@ fn get_expander(id: ExpID, _dst: &[u8], k: usize) -> Box<dyn Expander> {
     match id {
         ExpID::XMD(h) => match h {
             HashID::SHA256 => Box::new(ExpanderXmd {
-                hasher: PhantomData::<Sha256>,
+                hasher: Sha256::default(),
                 block_size: 64,
                 dst,
             }),
             HashID::SHA384 => Box::new(ExpanderXmd {
-                hasher: PhantomData::<Sha384>,
+                hasher: Sha384::default(),
                 block_size: 128,
                 dst,
             }),
             HashID::SHA512 => Box::new(ExpanderXmd {
-                hasher: PhantomData::<Sha512>,
+                hasher: Sha512::default(),
                 block_size: 128,
                 dst,
             }),
         },
         ExpID::XOF(x) => match x {
             XofID::SHAKE128 => Box::new(ExpanderXof {
-                xofer: PhantomData::<Shake128>,
+                xofer: Shake128::default(),
                 k,
                 dst,
             }),
             XofID::SHAKE256 => Box::new(ExpanderXof {
-                xofer: PhantomData::<Shake256>,
+                xofer: Shake256::default(),
                 k,
                 dst,
             }),
diff --git a/ff/src/fields/field_hashers/mod.rs b/ff/src/fields/field_hashers/mod.rs
index f8bd0b26b..bfd44f231 100644
--- a/ff/src/fields/field_hashers/mod.rs
+++ b/ff/src/fields/field_hashers/mod.rs
@@ -1,10 +1,9 @@
 mod expander;
 
-use core::marker::PhantomData;
-
 use crate::{Field, PrimeField};
 
-use digest::{FixedOutputReset, XofReader};
+use ark_std::vec::Vec;
+use digest::DynDigest;
 use expander::Expander;
 
 use self::expander::ExpanderXmd;
@@ -18,8 +17,8 @@ pub trait HashToField<F: Field>: Sized {
     /// * `domain` - bytes that get concatenated with the `msg` during hashing, in order to separate potentially interfering instantiations of the hasher.
     fn new(domain: &[u8]) -> Self;
 
-    /// Hash an arbitrary `msg` to `N` elements of the field `F`.
-    fn hash_to_field<const N: usize>(&self, msg: &[u8]) -> [F; N];
+    /// Hash an arbitrary `msg` to `count` elements of the field `F`.
+    fn hash_to_field(&self, msg: &[u8], count: usize) -> Vec<F>;
 }
 
 /// This field hasher constructs a Hash-To-Field based on a fixed-output hash function,
@@ -34,16 +33,16 @@ pub trait HashToField<F: Field>: Sized {
 /// use sha2::Sha256;
 ///
 /// let hasher = <DefaultFieldHasher<Sha256> as HashToField<Fq>>::new(&[1, 2, 3]);
-/// let field_elements: [Fq; 2] = hasher.hash_to_field(b"Hello, World!");
+/// let field_elements: Vec<Fq> = hasher.hash_to_field(b"Hello, World!", 2);
 ///
 /// assert_eq!(field_elements.len(), 2);
 /// ```
-pub struct DefaultFieldHasher<H: FixedOutputReset + Default + Clone, const SEC_PARAM: usize = 128> {
+pub struct DefaultFieldHasher<H: Default + DynDigest + Clone, const SEC_PARAM: usize = 128> {
     expander: ExpanderXmd<H>,
     len_per_base_elem: usize,
 }
 
-impl<F: Field, H: FixedOutputReset + Default + Clone, const SEC_PARAM: usize> HashToField<F>
+impl<F: Field, H: Default + DynDigest + Clone, const SEC_PARAM: usize> HashToField<F>
     for DefaultFieldHasher<H, SEC_PARAM>
 {
     fn new(dst: &[u8]) -> Self {
@@ -52,7 +51,7 @@ impl<F: Field, H: FixedOutputReset + Default + Clone, const SEC_PARAM: usize> Ha
         let len_per_base_elem = get_len_per_elem::<F, SEC_PARAM>();
 
         let expander = ExpanderXmd {
-            hasher: PhantomData,
+            hasher: H::default(),
             dst: dst.to_vec(),
             block_size: len_per_base_elem,
         };
@@ -63,49 +62,38 @@ impl<F: Field, H: FixedOutputReset + Default + Clone, const SEC_PARAM: usize> Ha
         }
     }
 
-    fn hash_to_field<const N: usize>(&self, message: &[u8]) -> [F; N] {
+    fn hash_to_field(&self, message: &[u8], count: usize) -> Vec<F> {
         let m = F::extension_degree() as usize;
 
-        // The user requests `N` of elements of F_p^m to output per input msg,
+        // The caller requests `count` elements of F_p^m per input msg,
         // each field element comprising `m` BasePrimeField elements.
-        let len_in_bytes = N * m * self.len_per_base_elem;
+        let len_in_bytes = count * m * self.len_per_base_elem;
         let uniform_bytes = self.expander.expand(message, len_in_bytes);
 
-        let cb = |i| {
-            let base_prime_field_elem = |j| {
+        let mut output = Vec::with_capacity(count);
+        let mut base_prime_field_elems = Vec::with_capacity(m);
+        for i in 0..count {
+            base_prime_field_elems.clear();
+            for j in 0..m {
                 let elm_offset = self.len_per_base_elem * (j + i * m);
-                F::BasePrimeField::from_be_bytes_mod_order(
+                let val = F::BasePrimeField::from_be_bytes_mod_order(
                     &uniform_bytes[elm_offset..][..self.len_per_base_elem],
-                )
-            };
-            F::from_base_prime_field_elems((0..m).map(base_prime_field_elem)).unwrap()
-        };
-        ark_std::array::from_fn::<F, N, _>(cb)
-    }
-}
-
-pub fn hash_to_field<F: Field, H: XofReader, const SEC_PARAM: usize>(h: &mut H) -> F {
-    // The final output of `hash_to_field` will be an array of field
-    // elements from F::BaseField, each of size `len_per_elem`.
-    let len_per_base_elem = get_len_per_elem::<F, SEC_PARAM>();
-    // Rust *still* lacks alloca, hence this ugly hack.
-    let mut alloca = [0u8; 2048];
-    let alloca = &mut alloca[0..len_per_base_elem];
-
-    let m = F::extension_degree() as usize;
+                );
+                base_prime_field_elems.push(val);
+            }
+            let f = F::from_base_prime_field_elems(base_prime_field_elems.drain(..)).unwrap();
+            output.push(f);
+        }
 
-    let base_prime_field_elem = |_| {
-        h.read(alloca);
-        F::BasePrimeField::from_be_bytes_mod_order(alloca)
-    };
-    F::from_base_prime_field_elems((0..m).map(base_prime_field_elem)).unwrap()
+        output
+    }
 }
 
 /// This function computes the length in bytes that a hash function should output
 /// for hashing an element of type `Field`.
 /// See section 5.1 and 5.3 of the
 /// [IETF hash standardization draft](https://datatracker.ietf.org/doc/draft-irtf-cfrg-hash-to-curve/14/)
-const fn get_len_per_elem<F: Field, const SEC_PARAM: usize>() -> usize {
+fn get_len_per_elem<F: Field, const SEC_PARAM: usize>() -> usize {
     // ceil(log(p))
     let base_field_size_in_bits = F::BasePrimeField::MODULUS_BIT_SIZE as usize;
     // ceil(log(p)) + security_parameter
diff --git a/test-templates/src/h2c/mod.rs b/test-templates/src/h2c/mod.rs
index 77b9a1a42..4cd52eb35 100644
--- a/test-templates/src/h2c/mod.rs
+++ b/test-templates/src/h2c/mod.rs
@@ -52,11 +52,11 @@ macro_rules! test_h2c {
 
                 for v in data.vectors.iter() {
                     // first, hash-to-field tests
-                    let got: [$base_prime_field; { 2 * $m }] =
-                        hasher.hash_to_field(&v.msg.as_bytes());
+                    let got: Vec<$base_prime_field> =
+                        hasher.hash_to_field(&v.msg.as_bytes(), 2 * $m);
                     let want: Vec<$base_prime_field> =
                         v.u.iter().map(read_fq_vec).flatten().collect();
-                    assert_eq!(got[..], *want);
+                    assert_eq!(got, want);
 
                     // then, test curve points
                     let x = read_fq_vec(&v.p.x);