roll up chi loop for gcc -Os Signed-off-by: Dave Rodgman <dave.rodgman@arm.com>

commit: 693fb4f0b2ccdde00ffdd7c1b5d2531b10ed79b9 [log] [tgz]
author: Dave Rodgman <dave.rodgman@arm.com> Wed Feb 14 13:46:30 2024 +0000
committer: Dave Rodgman <dave.rodgman@arm.com> Wed Feb 14 13:56:53 2024 +0000
tree: f20b379606046435967a1c0337b7c3d9a6dc24d3
parent: 1cf3585ee4fe188664de6b75d62b280b3d720072 [diff] [blame]
diff --git a/library/sha3.c b/library/sha3.c
index 5a854e4..935a666 100644
--- a/library/sha3.c
+++ b/library/sha3.c

@@ -10,6 +10,8 @@
  *  https://nvlpubs.nist.gov/nistpubs/fips/nist.fips.202.pdf
  */
 
+#include "common.h"
+
 /*
  * These macros select manually unrolled implementations of parts of the main permutation function.
  *
@@ -23,9 +25,13 @@
 #undef   MBEDTLS_SHA3_THETA_UNROLL //no-check-names
 #define  MBEDTLS_SHA3_RHO_UNROLL   //no-check-names
 #define  MBEDTLS_SHA3_PI_UNROLL    //no-check-names
-#undef   MBEDTLS_SHA3_CHI_UNROLL   //no-check-names
-
-#include "common.h"
+#if !defined(MBEDTLS_COMPILER_IS_GCC) || defined(__OPTIMIZE_SIZE__)
+/* GCC doesn't perform well with the rolled-up version, especially at -O2, so only enable on gcc
+ * if optimising for size. Always enable for other compilers. */
+#undef   MBEDTLS_SHA3_CHI_UNROLL    //no-check-names
+#else
+#define  MBEDTLS_SHA3_CHI_UNROLL    //no-check-names
+#endif
 
 #if defined(MBEDTLS_SHA3_C)
 
@@ -156,8 +162,7 @@
 #endif
 
         /* Chi */
-#if !defined(MBEDTLS_SHA3_CHI_UNROLL) && !defined(MBEDTLS_COMPILER_IS_GCC) //no-check-names
-        /* GCC doesn't perform well with the rolled-up version, especially at -O2. */
+#if !defined(MBEDTLS_SHA3_CHI_UNROLL) //no-check-names
         for (i = 0; i <= 20; i += 5) {
             lane[0] = s[i]; lane[1] = s[i + 1]; lane[2] = s[i + 2]; lane[3] = s[i + 3]; lane[4] = s[i + 4];
             s[i + 0] ^= (~lane[1]) & lane[2];
commit	693fb4f0b2ccdde00ffdd7c1b5d2531b10ed79b9	[log] [tgz]
author	Dave Rodgman <dave.rodgman@arm.com>	Wed Feb 14 13:46:30 2024 +0000
committer	Dave Rodgman <dave.rodgman@arm.com>	Wed Feb 14 13:56:53 2024 +0000
tree	f20b379606046435967a1c0337b7c3d9a6dc24d3
parent	1cf3585ee4fe188664de6b75d62b280b3d720072 [diff] [blame]