Optimize fix_negative

Reduce the code size, stack consumption and heap consumption in fix_negative by encoding the special-case subtraction manually. * Code size: ecp_curves.o goes down from 7837B down to 7769 in a sample Cortex-M0 build with all curves enabled. The savings come from not having to set up C in INIT (which is used many times) and from not having to catch errors in fix_negative. * Stack consumption: get rid of C on the stack. * Heap: mbedtls_mpi_sub_abs with destination == second operand would make a heap allocation. The new code doesn't do any heap allocation. * Performance: no measurable difference. Signed-off-by: Gilles Peskine <Gilles.Peskine@arm.com>
2025-10-03 01:17:10 +00:00 · 2020-07-22 19:58:28 +02:00 · 2020-07-22 19:58:28 +02:00 · d10e8fae9e
parent 28f62f6212
commit d10e8fae9e
1 changed files with 24 additions and 30 deletions
--- a/library/ecp_curves.c
+++ b/library/ecp_curves.c
@ -1000,25 +1000,20 @@ static inline void sub32( uint32_t *dst, uint32_t src, signed char *carry )
 #define ADD( j )    add32( &cur, A( j ), &c );
 #define SUB( j )    sub32( &cur, A( j ), &c );
 #define ciL    (sizeof(mbedtls_mpi_uint))         /* chars in limb  */
 #define biL    (ciL << 3)               /* bits  in limb  */
 /*
 * Helpers for the main 'loop'
 * (see fix_negative for the motivation of C)
 */
 #define INIT( b )                                                       \
    int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;                    \
    signed char c = 0, cc;                                              \
    uint32_t cur;                                                       \
    size_t i = 0, bits = (b);                                           \
-    mbedtls_mpi C;                                                      \
+    /* N is the size of the product of two b-bit numbers, plus one */   \
-    mbedtls_mpi_uint Cp[ (b) / 8 / sizeof( mbedtls_mpi_uint) + 1 ];     \
+    /* limb for fix_negative */                                         \
-                                                                        \
+    MBEDTLS_MPI_CHK( mbedtls_mpi_grow( N, ( b ) * 2 / biL + 1 ) );      \
    C.s = 1;                                                            \
    C.n = (b) / 8 / sizeof( mbedtls_mpi_uint) + 1;                      \
    C.p = Cp;                                                           \
    memset( Cp, 0, C.n * sizeof( mbedtls_mpi_uint ) );                  \
                                                                        \
    MBEDTLS_MPI_CHK( mbedtls_mpi_grow( N, (b) * 2 / 8 /                 \
                                       sizeof( mbedtls_mpi_uint ) ) );  \
    LOAD32;
 #define NEXT                    \
@ -1033,33 +1028,32 @@ static inline void sub32( uint32_t *dst, uint32_t src, signed char *carry )
    STORE32; i++;                               \
    cur = c > 0 ? c : 0; STORE32;               \
    cur = 0; while( ++i < MAX32 ) { STORE32; }  \
-    if( c < 0 ) MBEDTLS_MPI_CHK( fix_negative( N, c, &C, bits ) );
+    if( c < 0 ) fix_negative( N, c, bits );
 /*
 * If the result is negative, we get it in the form
 * c * 2^(bits + 32) + N, with c negative and N positive shorter than 'bits'
 */
-static inline int fix_negative( mbedtls_mpi *N, signed char c, mbedtls_mpi *C, size_t bits )
+static inline void fix_negative( mbedtls_mpi *N, signed char c, size_t bits )
 {
-    int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED;
+    size_t i;
-    /* C = - c * 2^(bits + 32) */
+    /* Set N := N - 2^bits */
-#if !defined(MBEDTLS_HAVE_INT64)
+    --N->p[0];
-    ((void) bits);
+    for( i = 0; i <= bits / 8 / sizeof( mbedtls_mpi_uint ); i++ )
-#else
+    {
-    if( bits == 224 )
+        N->p[i] = ~(mbedtls_mpi_uint)0 - N->p[i];
-        C->p[ C->n - 1 ] = ((mbedtls_mpi_uint) -c) << 32;
+    }
    else
 #endif
        C->p[ C->n - 1 ] = (mbedtls_mpi_uint) -c;
    /* N = - ( C - N ) */
    MBEDTLS_MPI_CHK( mbedtls_mpi_sub_abs( N, C, N ) );
    N->s = -1;
-cleanup:
+    /* Add |c| * 2^(bits + 32) to the absolute value. Since c and N are
-
+    * negative, this adds c * 2^(bits + 32). */
-    return( ret );
+    mbedtls_mpi_uint msw = (mbedtls_mpi_uint) -c;
 #if defined(MBEDTLS_HAVE_INT64)
    if( bits == 224 )
        msw <<= 32;
 #endif
    N->p[bits / 8 / sizeof( mbedtls_mpi_uint)] += msw;
 }
 #if defined(MBEDTLS_ECP_DP_SECP224R1_ENABLED)