mirror of
https://github.com/yuzu-emu/mbedtls.git
synced 2024-12-26 07:35:35 +00:00
Optimize fix_negative
Reduce the code size, stack consumption and heap consumption in fix_negative by encoding the special-case subtraction manually. * Code size: ecp_curves.o goes down from 7837B down to 7769 in a sample Cortex-M0 build with all curves enabled. The savings come from not having to set up C in INIT (which is used many times) and from not having to catch errors in fix_negative. * Stack consumption: get rid of C on the stack. * Heap: mbedtls_mpi_sub_abs with destination == second operand would make a heap allocation. The new code doesn't do any heap allocation. * Performance: no measurable difference. Signed-off-by: Gilles Peskine <Gilles.Peskine@arm.com>
This commit is contained in:
parent
28f62f6212
commit
d10e8fae9e
|
@ -1000,25 +1000,20 @@ static inline void sub32( uint32_t *dst, uint32_t src, signed char *carry )
|
||||||
#define ADD( j ) add32( &cur, A( j ), &c );
|
#define ADD( j ) add32( &cur, A( j ), &c );
|
||||||
#define SUB( j ) sub32( &cur, A( j ), &c );
|
#define SUB( j ) sub32( &cur, A( j ), &c );
|
||||||
|
|
||||||
|
#define ciL (sizeof(mbedtls_mpi_uint)) /* chars in limb */
|
||||||
|
#define biL (ciL << 3) /* bits in limb */
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Helpers for the main 'loop'
|
* Helpers for the main 'loop'
|
||||||
* (see fix_negative for the motivation of C)
|
|
||||||
*/
|
*/
|
||||||
#define INIT( b ) \
|
#define INIT( b ) \
|
||||||
int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED; \
|
int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED; \
|
||||||
signed char c = 0, cc; \
|
signed char c = 0, cc; \
|
||||||
uint32_t cur; \
|
uint32_t cur; \
|
||||||
size_t i = 0, bits = (b); \
|
size_t i = 0, bits = (b); \
|
||||||
mbedtls_mpi C; \
|
/* N is the size of the product of two b-bit numbers, plus one */ \
|
||||||
mbedtls_mpi_uint Cp[ (b) / 8 / sizeof( mbedtls_mpi_uint) + 1 ]; \
|
/* limb for fix_negative */ \
|
||||||
\
|
MBEDTLS_MPI_CHK( mbedtls_mpi_grow( N, ( b ) * 2 / biL + 1 ) ); \
|
||||||
C.s = 1; \
|
|
||||||
C.n = (b) / 8 / sizeof( mbedtls_mpi_uint) + 1; \
|
|
||||||
C.p = Cp; \
|
|
||||||
memset( Cp, 0, C.n * sizeof( mbedtls_mpi_uint ) ); \
|
|
||||||
\
|
|
||||||
MBEDTLS_MPI_CHK( mbedtls_mpi_grow( N, (b) * 2 / 8 / \
|
|
||||||
sizeof( mbedtls_mpi_uint ) ) ); \
|
|
||||||
LOAD32;
|
LOAD32;
|
||||||
|
|
||||||
#define NEXT \
|
#define NEXT \
|
||||||
|
@ -1033,33 +1028,32 @@ static inline void sub32( uint32_t *dst, uint32_t src, signed char *carry )
|
||||||
STORE32; i++; \
|
STORE32; i++; \
|
||||||
cur = c > 0 ? c : 0; STORE32; \
|
cur = c > 0 ? c : 0; STORE32; \
|
||||||
cur = 0; while( ++i < MAX32 ) { STORE32; } \
|
cur = 0; while( ++i < MAX32 ) { STORE32; } \
|
||||||
if( c < 0 ) MBEDTLS_MPI_CHK( fix_negative( N, c, &C, bits ) );
|
if( c < 0 ) fix_negative( N, c, bits );
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* If the result is negative, we get it in the form
|
* If the result is negative, we get it in the form
|
||||||
* c * 2^(bits + 32) + N, with c negative and N positive shorter than 'bits'
|
* c * 2^(bits + 32) + N, with c negative and N positive shorter than 'bits'
|
||||||
*/
|
*/
|
||||||
static inline int fix_negative( mbedtls_mpi *N, signed char c, mbedtls_mpi *C, size_t bits )
|
static inline void fix_negative( mbedtls_mpi *N, signed char c, size_t bits )
|
||||||
{
|
{
|
||||||
int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;
|
size_t i;
|
||||||
|
|
||||||
/* C = - c * 2^(bits + 32) */
|
/* Set N := N - 2^bits */
|
||||||
#if !defined(MBEDTLS_HAVE_INT64)
|
--N->p[0];
|
||||||
((void) bits);
|
for( i = 0; i <= bits / 8 / sizeof( mbedtls_mpi_uint ); i++ )
|
||||||
#else
|
{
|
||||||
if( bits == 224 )
|
N->p[i] = ~(mbedtls_mpi_uint)0 - N->p[i];
|
||||||
C->p[ C->n - 1 ] = ((mbedtls_mpi_uint) -c) << 32;
|
}
|
||||||
else
|
|
||||||
#endif
|
|
||||||
C->p[ C->n - 1 ] = (mbedtls_mpi_uint) -c;
|
|
||||||
|
|
||||||
/* N = - ( C - N ) */
|
|
||||||
MBEDTLS_MPI_CHK( mbedtls_mpi_sub_abs( N, C, N ) );
|
|
||||||
N->s = -1;
|
N->s = -1;
|
||||||
|
|
||||||
cleanup:
|
/* Add |c| * 2^(bits + 32) to the absolute value. Since c and N are
|
||||||
|
* negative, this adds c * 2^(bits + 32). */
|
||||||
return( ret );
|
mbedtls_mpi_uint msw = (mbedtls_mpi_uint) -c;
|
||||||
|
#if defined(MBEDTLS_HAVE_INT64)
|
||||||
|
if( bits == 224 )
|
||||||
|
msw <<= 32;
|
||||||
|
#endif
|
||||||
|
N->p[bits / 8 / sizeof( mbedtls_mpi_uint)] += msw;
|
||||||
}
|
}
|
||||||
|
|
||||||
#if defined(MBEDTLS_ECP_DP_SECP224R1_ENABLED)
|
#if defined(MBEDTLS_ECP_DP_SECP224R1_ENABLED)
|
||||||
|
|
Loading…
Reference in a new issue