awslabs · jargh · Mar 22, 2025 · Mar 22, 2025 · Mar 23, 2025 · Mar 24, 2025
diff --git a/arm/curve25519/bignum_add_p25519.S b/arm/curve25519/bignum_add_p25519.S
@@ -10,9 +10,11 @@
 //
 // Standard ARM ABI: X0 = z, X1 = x, X2 = y
 // ----------------------------------------------------------------------------
-#include "_internal_s2n_bignum.h"
+
+#include "_internal_s2n_bignum_arm.h"
 
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_add_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_add_p25519)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_add_p25519)
 
         .text
@@ -31,6 +33,7 @@
 #define c3 x10
 
 S2N_BN_SYMBOL(bignum_add_p25519):
+        CFI_START
 
 // Add as [d3; d2; d1; d0] = x + y; since we assume x, y < 2^255 - 19
 // this sum fits in 256 bits
@@ -67,7 +70,7 @@ S2N_BN_SYMBOL(bignum_add_p25519):
         stp     d0, d1, [z]
         stp     d2, d3, [z, #16]
 
-        ret
+        CFI_RET
 
 #if defined(__linux__) && defined(__ELF__)
 .section .note.GNU-stack,"",%progbits

diff --git a/arm/curve25519/bignum_cmul_p25519.S b/arm/curve25519/bignum_cmul_p25519.S
@@ -11,11 +11,14 @@
 //
 // Standard ARM ABI: X0 = z, X1 = c, X2 = x
 // ----------------------------------------------------------------------------
-#include "_internal_s2n_bignum.h"
+
+#include "_internal_s2n_bignum_arm.h"
 
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_cmul_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_cmul_p25519)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_cmul_p25519)
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_cmul_p25519_alt)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_cmul_p25519_alt)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_cmul_p25519_alt)
         .text
         .balign 4
@@ -44,6 +47,7 @@
 
 S2N_BN_SYMBOL(bignum_cmul_p25519):
 S2N_BN_SYMBOL(bignum_cmul_p25519_alt):
+        CFI_START
 
 // First do the multiply, straightforwardly to get [d4;d3;d2;d1;d0]
 
@@ -92,7 +96,7 @@ S2N_BN_SYMBOL(bignum_cmul_p25519_alt):
         stp     d0, d1, [z]
         stp     d2, d3, [z, #16]
 
-        ret
+        CFI_RET
 
 #if defined(__linux__) && defined(__ELF__)
 .section .note.GNU-stack,"",%progbits

diff --git a/arm/curve25519/bignum_double_p25519.S b/arm/curve25519/bignum_double_p25519.S
@@ -10,9 +10,11 @@
 //
 // Standard ARM ABI: X0 = z, X1 = x
 // ----------------------------------------------------------------------------
-#include "_internal_s2n_bignum.h"
+
+#include "_internal_s2n_bignum_arm.h"
 
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_double_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_double_p25519)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_double_p25519)
 
         .text
@@ -30,6 +32,7 @@
 #define c3 x9
 
 S2N_BN_SYMBOL(bignum_double_p25519):
+        CFI_START
 
 // Double by adding as [d3; d2; d1; d0] = 2 * x; since we assume
 // x < 2^255 - 19 this result fits in 256 bits
@@ -64,7 +67,7 @@ S2N_BN_SYMBOL(bignum_double_p25519):
         stp     d0, d1, [z]
         stp     d2, d3, [z, #16]
 
-        ret
+        CFI_RET
 
 #if defined(__linux__) && defined(__ELF__)
 .section .note.GNU-stack,"",%progbits

diff --git a/arm/curve25519/bignum_inv_p25519.S b/arm/curve25519/bignum_inv_p25519.S
@@ -13,9 +13,11 @@
 //
 // Standard ARM ABI: X0 = z, X1 = x
 // ----------------------------------------------------------------------------
-#include "_internal_s2n_bignum.h"
+
+#include "_internal_s2n_bignum_arm.h"
 
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_inv_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_inv_p25519)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_inv_p25519)
 
         .text
@@ -70,7 +72,7 @@
 
 // Total size to reserve on the stack
 
-#define NSPACE #(16*N)
+#define NSPACE (16*N)
 
 // Very similar to a subroutine call to the s2n-bignum word_divstep59.
 // But different in register usage and returning the final matrix in
@@ -695,12 +697,13 @@
         movk    nn, n3, lsl #48
 
 S2N_BN_SYMBOL(bignum_inv_p25519):
+        CFI_START
 
 // Save registers and make room for temporaries
 
-        stp     x19, x20, [sp, -16]!
-        stp     x21, x22, [sp, -16]!
-        sub     sp, sp, NSPACE
+        CFI_PUSH2(x19,x20)
+        CFI_PUSH2(x21,x22)
+        CFI_DEC_SP(NSPACE)
 
 // Save the return pointer for the end so we can overwrite x0 later
 
@@ -755,9 +758,9 @@ S2N_BN_SYMBOL(bignum_inv_p25519):
 
         mov     i, #10
         mov     d, #1
-        b       bignum_inv_p25519_midloop
+        b       Lbignum_inv_p25519_midloop
 
-bignum_inv_p25519_loop:
+Lbignum_inv_p25519_loop:
 
 // Separate the matrix elements into sign-magnitude pairs
 
@@ -1086,7 +1089,7 @@ bignum_inv_p25519_loop:
         stp     x0, x1, [v]
         stp     x3, x2, [v+16]
 
-bignum_inv_p25519_midloop:
+Lbignum_inv_p25519_midloop:
 
         mov     x1, d
         ldr     x2, [f]
@@ -1097,7 +1100,7 @@ bignum_inv_p25519_midloop:
 // Next iteration
 
         subs    i, i, #1
-        bne     bignum_inv_p25519_loop
+        bne     Lbignum_inv_p25519_loop
 
 // The 10th and last iteration does not need anything except the
 // u value and the sign of f; the latter can be obtained from the
@@ -1245,10 +1248,10 @@ bignum_inv_p25519_midloop:
 
 // Restore stack and registers
 
-        add     sp, sp, NSPACE
-        ldp     x21, x22, [sp], 16
-        ldp     x19, x20, [sp], 16
-        ret
+        CFI_INC_SP(NSPACE)
+        CFI_POP2(x21,x22)
+        CFI_POP2(x19,x20)
+        CFI_RET
 
 #if defined(__linux__) && defined(__ELF__)
 .section .note.GNU-stack, "", %progbits

diff --git a/arm/curve25519/bignum_invsqrt_p25519.S b/arm/curve25519/bignum_invsqrt_p25519.S
@@ -20,11 +20,16 @@
 //
 // Standard ARM ABI: X0 = z, X1 = x
 // ----------------------------------------------------------------------------
-#include "_internal_s2n_bignum.h"
+
+#include "_internal_s2n_bignum_arm.h"
 
         S2N_BN_SYM_VISIBILITY_DIRECTIVE(bignum_invsqrt_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(bignum_invsqrt_p25519)
         S2N_BN_SYM_PRIVACY_DIRECTIVE(bignum_invsqrt_p25519)
 
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(Lbignum_invsqrt_p25519_mul_p25519)
+        S2N_BN_FUNCTION_TYPE_DIRECTIVE(Lbignum_invsqrt_p25519_nsqr_p25519)
+
         .text
         .balign 4
 
@@ -45,7 +50,7 @@
 
 // Total size to reserve on the stack
 
-#define NSPACE #(16*N)
+#define NSPACE (16*N)
 
 // Loading large constants
 
@@ -61,20 +66,21 @@
         add     x0, dest __LF                                              \
         add     x1, src1 __LF                                              \
         add     x2, src2 __LF                                              \
-        bl      bignum_invsqrt_p25519_mul_p25519
+        CFI_BL(Lbignum_invsqrt_p25519_mul_p25519)
 
 #define nsqr(dest,n,src)                                                \
         add     x0, dest __LF                                              \
         mov     x1, n __LF                                                 \
         add     x2, src __LF                                               \
-        bl      bignum_invsqrt_p25519_nsqr_p25519
+        CFI_BL(Lbignum_invsqrt_p25519_nsqr_p25519)
 
 S2N_BN_SYMBOL(bignum_invsqrt_p25519):
+        CFI_START
 
 // Save registers and make room for temporaries
 
-        stp     x19, x30, [sp, -16]!
-        sub     sp, sp, NSPACE
+        CFI_PUSH2(x19,x30)
+        CFI_DEC_SP(NSPACE)
 
 // Save the return pointer for the end so we can overwrite x0 later
 
@@ -215,7 +221,7 @@ S2N_BN_SYMBOL(bignum_invsqrt_p25519):
 
         add     x0, b
         mov     x1, #1
-        bl      bignum_invsqrt_p25519_nsqr_p25519
+        CFI_BL(Lbignum_invsqrt_p25519_nsqr_p25519)
         mulp(b,a,b)
 
         ldp     x10, x11, [b]
@@ -236,15 +242,16 @@ S2N_BN_SYMBOL(bignum_invsqrt_p25519):
 
 // Restore stack and registers
 
-        add     sp, sp, NSPACE
-        ldp     x19, x30, [sp], 16
-        ret
+        CFI_INC_SP(NSPACE)
+        CFI_POP2(x19,x30)
+        CFI_RET
 
 // *************************************************************
 // Local z = x * y
 // *************************************************************
 
-bignum_invsqrt_p25519_mul_p25519:
+Lbignum_invsqrt_p25519_mul_p25519:
+        CFI_START
         ldp     x3, x4, [x1]
         ldp     x5, x6, [x2]
         umull   x7, w3, w5
@@ -425,13 +432,14 @@ bignum_invsqrt_p25519_mul_p25519:
         and     x10, x10, #0x7fffffffffffffff
         stp     x7, x8, [x0]
         stp     x9, x10, [x0, #16]
-        ret
+        CFI_RET
 
 // *************************************************************
 // Local z = 2^n * x
 // *************************************************************
 
-bignum_invsqrt_p25519_nsqr_p25519:
+Lbignum_invsqrt_p25519_nsqr_p25519:
+        CFI_START
 
 // Copy input argument into [x13;x12;x11;x10]
 
@@ -441,7 +449,7 @@ bignum_invsqrt_p25519_nsqr_p25519:
 // Main squaring loop, accumulating in [x13;x12;x11;x10] consistently and
 // only ensuring the intermediates are < 2 * p_25519 = 2^256 - 38
 
-bignum_invsqrt_p25519_loop:
+Lbignum_invsqrt_p25519_loop:
         umull   x2, w10, w10
         lsr     x14, x10, #32
         umull   x3, w14, w14
@@ -572,7 +580,7 @@ bignum_invsqrt_p25519_loop:
 // Loop as applicable
 
         subs    x1, x1, #1
-        bne     bignum_invsqrt_p25519_loop
+        bne     Lbignum_invsqrt_p25519_loop
 
 // We know the intermediate result x < 2^256 - 38, and now we do strict
 // modular reduction mod 2^255 - 19. Note x < 2^255 - 19 <=> x + 19 < 2^255
@@ -593,7 +601,7 @@ bignum_invsqrt_p25519_loop:
 
         stp     x10, x11, [x0]
         stp     x12, x13, [x0, #16]
-        ret
+        CFI_RET
 
 #if defined(__linux__) && defined(__ELF__)
 .section .note.GNU-stack, "", %progbits