|
1 |
| -use criterion::{black_box, criterion_group, criterion_main, BatchSize, Criterion, Throughput}; |
2 |
| -use rand::{thread_rng, Rng}; |
| 1 | +use divan; |
| 2 | +use divan::counter::{BytesCount, BytesFormat, ItemsCount}; |
| 3 | +use rand::prelude::*; |
| 4 | +use rand_chacha::ChaCha8Rng; |
3 | 5 | use turboshake::keccak;
|
4 | 6 |
|
5 |
| -#[cfg(any( |
6 |
| - target_arch = "x86_64", |
7 |
| - target_arch = "x86", |
8 |
| - target_arch = "aarch64", |
9 |
| - target_arch = "loongarch64" |
10 |
| -))] |
11 |
| -use criterion_cycles_per_byte::CyclesPerByte; |
12 |
| - |
13 |
| -#[cfg(any( |
14 |
| - target_arch = "x86_64", |
15 |
| - target_arch = "x86", |
16 |
| - target_arch = "aarch64", |
17 |
| - target_arch = "loongarch64" |
18 |
| -))] |
19 |
| -type CriterionHandler = Criterion<CyclesPerByte>; |
20 |
| - |
21 |
| -#[cfg(not(any( |
22 |
| - target_arch = "x86_64", |
23 |
| - target_arch = "x86", |
24 |
| - target_arch = "aarch64", |
25 |
| - target_arch = "loongarch64" |
26 |
| -)))] |
27 |
| -type CriterionHandler = Criterion; |
28 |
| - |
29 |
| -#[cfg(not(any(feature = "simdx2", feature = "simdx4")))] |
30 |
| -fn keccak(c: &mut CriterionHandler) { |
31 |
| - let mut rng = thread_rng(); |
32 |
| - |
33 |
| - let mut group = c.benchmark_group("keccak"); |
34 |
| - group.throughput(Throughput::Bytes(200u64)); // size of keccak-p[1600] permutation state |
35 |
| - |
36 |
| - group.bench_function("keccak-p[1600, 12] (cached)", |bench| { |
37 |
| - let mut state = [0u64; 25]; |
38 |
| - rng.fill(&mut state); |
39 |
| - |
40 |
| - bench.iter(|| keccak::permute(black_box(&mut state))) |
41 |
| - }); |
42 |
| - group.bench_function("keccak-p[1600, 12] (random)", |bench| { |
43 |
| - let mut state = [0u64; 25]; |
44 |
| - rng.fill(&mut state); |
45 |
| - |
46 |
| - bench.iter_batched( |
47 |
| - || state.clone(), |
48 |
| - |mut state| keccak::permute(black_box(&mut state)), |
49 |
| - BatchSize::SmallInput, |
50 |
| - ) |
51 |
| - }); |
52 |
| - |
53 |
| - group.finish(); |
| 7 | +fn main() { |
| 8 | + divan::Divan::default().bytes_format(BytesFormat::Binary).run_benches(); |
54 | 9 | }
|
55 | 10 |
|
56 |
| -#[cfg(any(feature = "simdx2", feature = "simdx4"))] |
57 |
| -fn keccak(c: &mut CriterionHandler) { |
58 |
| - let mut rng = thread_rng(); |
59 |
| - |
60 |
| - let mut group = c.benchmark_group("keccak"); |
61 |
| - |
62 |
| - #[cfg(feature = "simdx2")] |
63 |
| - { |
64 |
| - group.throughput(Throughput::Bytes(200u64 * 2)); |
| 11 | +#[divan::bench] |
| 12 | +fn permute_12_rounds(bencher: divan::Bencher) { |
| 13 | + let mut rng = ChaCha8Rng::from_os_rng(); |
65 | 14 |
|
66 |
| - group.bench_function("keccak-p[1600, 12] x2 (cached)", |bench| { |
67 |
| - let mut state0 = [0u64; 25]; |
68 |
| - let mut state1 = [0u64; 25]; |
69 |
| - rng.fill(&mut state0); |
70 |
| - rng.fill(&mut state1); |
| 15 | + let mut state = [0u64; 25]; |
| 16 | + let state_byte_len = state.len() * 8; |
| 17 | + rng.fill(&mut state); |
71 | 18 |
|
72 |
| - bench.iter(|| keccak::permutex2(black_box(&mut state0), black_box(&mut state1))); |
73 |
| - }); |
74 |
| - group.bench_function("keccak-p[1600, 12] x2 (random)", |bench| { |
75 |
| - let mut state0 = [0u64; 25]; |
76 |
| - let mut state1 = [0u64; 25]; |
77 |
| - rng.fill(&mut state0); |
78 |
| - rng.fill(&mut state1); |
79 |
| - |
80 |
| - bench.iter_batched( |
81 |
| - || (state0.clone(), state1.clone()), |
82 |
| - |(mut state0, mut state1)| { |
83 |
| - keccak::permutex2(black_box(&mut state0), black_box(&mut state1)) |
84 |
| - }, |
85 |
| - BatchSize::SmallInput, |
86 |
| - ) |
87 |
| - }); |
88 |
| - } |
89 |
| - |
90 |
| - #[cfg(feature = "simdx4")] |
91 |
| - { |
92 |
| - group.throughput(Throughput::Bytes(200u64 * 4)); |
93 |
| - |
94 |
| - group.bench_function("keccak-p[1600, 12] x4 (cached)", |bench| { |
95 |
| - let mut state0 = [0u64; 25]; |
96 |
| - let mut state1 = [0u64; 25]; |
97 |
| - let mut state2 = [0u64; 25]; |
98 |
| - let mut state3 = [0u64; 25]; |
99 |
| - rng.fill(&mut state0); |
100 |
| - rng.fill(&mut state1); |
101 |
| - rng.fill(&mut state2); |
102 |
| - rng.fill(&mut state3); |
103 |
| - |
104 |
| - bench.iter(|| { |
105 |
| - keccak::permutex4( |
106 |
| - black_box(&mut state0), |
107 |
| - black_box(&mut state1), |
108 |
| - black_box(&mut state2), |
109 |
| - black_box(&mut state3), |
110 |
| - ) |
111 |
| - }); |
112 |
| - }); |
113 |
| - group.bench_function("keccak-p[1600, 12] x4 (random)", |bench| { |
114 |
| - let mut state0 = [0u64; 25]; |
115 |
| - let mut state1 = [0u64; 25]; |
116 |
| - let mut state2 = [0u64; 25]; |
117 |
| - let mut state3 = [0u64; 25]; |
118 |
| - rng.fill(&mut state0); |
119 |
| - rng.fill(&mut state1); |
120 |
| - rng.fill(&mut state2); |
121 |
| - rng.fill(&mut state3); |
122 |
| - |
123 |
| - bench.iter_batched( |
124 |
| - || { |
125 |
| - ( |
126 |
| - state0.clone(), |
127 |
| - state1.clone(), |
128 |
| - state2.clone(), |
129 |
| - state3.clone(), |
130 |
| - ) |
131 |
| - }, |
132 |
| - |(mut state0, mut state1, mut state2, mut state3)| { |
133 |
| - keccak::permutex4( |
134 |
| - black_box(&mut state0), |
135 |
| - black_box(&mut state1), |
136 |
| - black_box(&mut state2), |
137 |
| - black_box(&mut state3), |
138 |
| - ) |
139 |
| - }, |
140 |
| - BatchSize::SmallInput, |
141 |
| - ) |
142 |
| - }); |
143 |
| - } |
144 |
| - |
145 |
| - group.finish(); |
| 19 | + bencher |
| 20 | + .counter(BytesCount::new(state_byte_len)) |
| 21 | + .counter(ItemsCount::new(1usize)) |
| 22 | + .with_inputs(|| (state.clone())) |
| 23 | + .bench_values(|mut state| keccak::permute(divan::black_box(&mut state))); |
146 | 24 | }
|
147 |
| - |
148 |
| -#[cfg(any( |
149 |
| - target_arch = "x86_64", |
150 |
| - target_arch = "x86", |
151 |
| - target_arch = "aarch64", |
152 |
| - target_arch = "loongarch64" |
153 |
| -))] |
154 |
| -criterion_group!(name = permutation; config = Criterion::default().with_measurement(CyclesPerByte); targets = keccak); |
155 |
| - |
156 |
| -#[cfg(not(any( |
157 |
| - target_arch = "x86_64", |
158 |
| - target_arch = "x86", |
159 |
| - target_arch = "aarch64", |
160 |
| - target_arch = "loongarch64" |
161 |
| -)))] |
162 |
| -criterion_group!(permutation, keccak); |
163 |
| - |
164 |
| -criterion_main!(permutation); |
0 commit comments