From efc3d734b0c8c1044f1c270db277ddaa5422e382 Mon Sep 17 00:00:00 2001 From: behzad nouri Date: Sun, 1 Jan 2023 08:58:16 -0500 Subject: [PATCH] simplifies sigverify copy_return_values --- ledger/src/sigverify_shreds.rs | 7 ++----- perf/src/sigverify.rs | 34 +++++++++++++--------------------- 2 files changed, 15 insertions(+), 26 deletions(-) diff --git a/ledger/src/sigverify_shreds.rs b/ledger/src/sigverify_shreds.rs index ae58a35334368b..99d3630123d4e2 100644 --- a/ledger/src/sigverify_shreds.rs +++ b/ledger/src/sigverify_shreds.rs @@ -246,12 +246,9 @@ pub fn verify_shreds_gpu( trace!("out buf {:?}", out); // Each shred has exactly one signature. - let v_sig_lens: Vec<_> = batches - .iter() - .map(|batch| vec![1u32; batch.len()]) - .collect(); + let v_sig_lens = batches.iter().map(|batch| repeat(1u32).take(batch.len())); let mut rvs: Vec<_> = batches.iter().map(|batch| vec![0u8; batch.len()]).collect(); - sigverify::copy_return_values(&v_sig_lens, &out, &mut rvs); + sigverify::copy_return_values(v_sig_lens, &out, &mut rvs); inc_new_counter_debug!("ed25519_shred_verify_gpu", out.len()); rvs diff --git a/perf/src/sigverify.rs b/perf/src/sigverify.rs index af5ac15884c64b..d37630961ec31e 100644 --- a/perf/src/sigverify.rs +++ b/perf/src/sigverify.rs @@ -664,26 +664,18 @@ pub fn ed25519_verify_disabled(batches: &mut [PacketBatch]) { inc_new_counter_debug!("ed25519_verify_disabled", packet_count); } -pub fn copy_return_values(sig_lens: &[Vec], out: &PinnedVec, rvs: &mut [Vec]) { - let mut num = 0; - for (vs, sig_vs) in rvs.iter_mut().zip(sig_lens.iter()) { - for (v, sig_v) in vs.iter_mut().zip(sig_vs.iter()) { - if *sig_v == 0 { - *v = 0; - } else { - let mut vout = 1; - for _ in 0..*sig_v { - if 0 == out[num] { - vout = 0; - } - num = num.saturating_add(1); - } - *v = vout; - } - if *v != 0 { - trace!("VERIFIED PACKET!!!!!"); - } - } +pub fn copy_return_values(sig_lens: I, out: &PinnedVec, rvs: &mut [Vec]) +where + I: IntoIterator, + T: IntoIterator, +{ + debug_assert!(rvs.iter().flatten().all(|&rv| rv == 0u8)); + let mut offset = 0; + let rvs = rvs.iter_mut().flatten(); + for (k, rv) in sig_lens.into_iter().flatten().zip(rvs) { + let out = out[offset..].iter().take(k as usize).all(|&x| x == 1); + *rv = u8::from(k != 0 && out); + offset = offset.saturating_add(k as usize); } } @@ -796,7 +788,7 @@ pub fn ed25519_verify( } } trace!("done verify"); - copy_return_values(&sig_lens, &out, &mut rvs); + copy_return_values(sig_lens, &out, &mut rvs); mark_disabled(batches, &rvs); inc_new_counter_debug!("ed25519_verify_gpu", valid_packet_count); }