From 4f2e3ab022e887e33aff5e2dccb8e6dc7074cbcf Mon Sep 17 00:00:00 2001
From: Paul Duncan <pabs@pablotron.org>
Date: Mon, 29 Apr 2024 12:06:36 -0400
Subject: sha3.c: build permute12_scalar() during testing, remove old comment

---
 sha3.c | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

(limited to 'sha3.c')

diff --git a/sha3.c b/sha3.c
index 3e8a28c..887c5c2 100644
--- a/sha3.c
+++ b/sha3.c
@@ -177,9 +177,7 @@ static inline void chi(uint64_t dst[static 25], const uint64_t src[static 25]) {
 static inline void iota(uint64_t a[static 25], const int i) {
   a[0] ^= RCS[i];
 }
-#endif /* !defined(__AVX512F__) || defined(SHA3_TEST) */
 
-#ifndef __AVX512F__
 // 24-round keccak permutation (scalar implementation)
 static inline void permute_scalar(uint64_t a[static 25]) {
   uint64_t tmp[25] = { 0 };
@@ -204,17 +202,13 @@ static inline void permute12_scalar(uint64_t a[static 25]) {
     iota(a, 12 + i);
   }
 }
-#endif /* !__AVX512F__ */
+#endif /* !defined(__AVX512F__) || defined(SHA3_TEST) */
 
 #ifdef __AVX512F__
 #include <immintrin.h>
 
 // 24 round keccak permutation (avx512 implementation).
 //
-// copied from `permute_avx512_fast()` in `tests/permute/permute.c`. all
-// steps are inlined as blocks. ~3x faster than scalar implementation,
-// but could be sped up more.
-//
 // how it operates (roughly):
 //
 // 1. load rows from state `s` into avx512 registers r0-r4, like so:
-- 
cgit v1.2.3