Merge pull request #7462 from daverodgman/clz_size_opt

clz size/perf optimisation
This commit is contained in:
Tom Cosgrove 2023-04-26 07:06:30 +01:00 committed by GitHub
commit 10f40916eb
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
4 changed files with 90 additions and 12 deletions

View file

@ -33,8 +33,25 @@
#include "bn_mul.h"
#include "constant_time_internal.h"
size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a)
inline size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a)
{
#if defined(__has_builtin)
#if __has_builtin(__builtin_clz)
if (sizeof(mbedtls_mpi_uint) == sizeof(unsigned int)) {
return (size_t) __builtin_clz(a);
}
#endif
#if __has_builtin(__builtin_clzl)
if (sizeof(mbedtls_mpi_uint) == sizeof(unsigned long)) {
return (size_t) __builtin_clzl(a);
}
#endif
#if __has_builtin(__builtin_clzll)
if (sizeof(mbedtls_mpi_uint) == sizeof(unsigned long long)) {
return (size_t) __builtin_clzll(a);
}
#endif
#endif
size_t j;
mbedtls_mpi_uint mask = (mbedtls_mpi_uint) 1 << (biL - 1);
@ -51,21 +68,17 @@ size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a)
size_t mbedtls_mpi_core_bitlen(const mbedtls_mpi_uint *A, size_t A_limbs)
{
size_t i, j;
int i;
size_t j;
if (A_limbs == 0) {
return 0;
}
for (i = A_limbs - 1; i > 0; i--) {
for (i = ((int) A_limbs) - 1; i >= 0; i--) {
if (A[i] != 0) {
break;
}
}
j = biL - mbedtls_mpi_core_clz(A[i]);
return (i * biL) + j;
}
}
return 0;
}
/* Convert a big-endian byte array aligned to the size of mbedtls_mpi_uint

View file

@ -101,10 +101,13 @@
(((X)[(i) / ciL] >> (((i) % ciL) * 8)) & 0xff)
/** Count leading zero bits in a given integer.
*
* \warning The result is undefined if \p a == 0
*
* \param a Integer to count leading zero bits.
*
* \return The number of leading zero bits in \p a.
* \return The number of leading zero bits in \p a, if \p a != 0.
* If \p a == 0, the result is undefined.
*/
size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a);

View file

@ -309,6 +309,36 @@ exit:
}
/* END_CASE */
/* BEGIN_CASE */
void mpi_core_clz(int leading_zeros, int trailing_zeros)
{
if ((size_t) (leading_zeros + trailing_zeros) >= (sizeof(mbedtls_mpi_uint) * 8)) {
// can't fit required number of leading and trailing zeros - skip test
goto exit;
}
// Construct a test input value where the count of leading zeros and
// trailing zeros is given in the test case, and we add ones to fill
// the gap.
mbedtls_mpi_uint x;
if ((leading_zeros + trailing_zeros) > 0) {
// some zero bits
uint32_t s = (sizeof(mbedtls_mpi_uint) * 8 - leading_zeros - trailing_zeros);
x = ((((mbedtls_mpi_uint) 1) << s) - 1) << trailing_zeros;
} else {
// all bits set
x = ~((mbedtls_mpi_uint) 0);
}
size_t n = mbedtls_mpi_core_clz(x);
TEST_EQUAL(n, leading_zeros);
exit:
;
}
/* END_CASE */
/* BEGIN_CASE */
void mpi_core_lt_ct(char *input_X, char *input_Y, int exp_ret)
{

View file

@ -491,3 +491,35 @@ mpi_core_fill_random:42:0:-1:0:MBEDTLS_ERR_MPI_BAD_INPUT_DATA
Fill random core: 42 bytes, 5 missing limbs
mpi_core_fill_random:42:0:-5:0:MBEDTLS_ERR_MPI_BAD_INPUT_DATA
CLZ: 0 0: all ones
mpi_core_clz:0:0
CLZ: 1 0
mpi_core_clz:1:0
CLZ: 1 1
mpi_core_clz:1:1
CLZ: 4 5
mpi_core_clz:4:5
CLZ: 8 16
mpi_core_clz:8:16
CLZ: 31 0
mpi_core_clz:31:0
CLZ: 32 0
mpi_core_clz:32:0
CLZ: 33 0
mpi_core_clz:33:0
CLZ: 63 0
mpi_core_clz:63:0
CLZ: 64 0
mpi_core_clz:64:0
CLZ: 100000 0: skip overly long input
mpi_core_clz:100000:0