newlib: libc: strcmp M-profile PACBTI-enablement

Add function prologue/epilogue to conditionally add BTI landing pads
and/or PAC code generation & authentication instructions depending on
compilation flags.

This patch enables PACBTI for all relevant variants of strcmp:
     * Newlib for armv8.1-m.main+pacbti
     * Newlib for armv8.1-m.main+pacbti+mve
     * Newlib-nano
This commit is contained in:
Victor L. Do Nascimento 2022-12-21 11:21:22 +00:00 committed by Richard Earnshaw
parent 9d6b00511e
commit ebd922e77a
3 changed files with 60 additions and 31 deletions

View File

@ -29,10 +29,14 @@
/* Tiny version of strcmp in ARM state. Used only when optimizing /* Tiny version of strcmp in ARM state. Used only when optimizing
for size. Also supports Thumb-2. */ for size. Also supports Thumb-2. */
#include "arm_asm.h"
.syntax unified .syntax unified
def_fn strcmp def_fn strcmp
.fnstart
.cfi_sections .debug_frame .cfi_sections .debug_frame
.cfi_startproc .cfi_startproc
prologue
1: 1:
ldrb r2, [r0], #1 ldrb r2, [r0], #1
ldrb r3, [r1], #1 ldrb r3, [r1], #1
@ -42,6 +46,8 @@ def_fn strcmp
beq 1b beq 1b
2: 2:
subs r0, r2, r3 subs r0, r2, r3
bx lr epilogue
.cfi_endproc .cfi_endproc
.cantunwind
.fnend
.size strcmp, . - strcmp .size strcmp, . - strcmp

View File

@ -45,6 +45,8 @@
.thumb .thumb
.syntax unified .syntax unified
#include "arm_asm.h"
/* Parameters and result. */ /* Parameters and result. */
#define src1 r0 #define src1 r0
#define src2 r1 #define src2 r1
@ -91,8 +93,9 @@
ldrd r4, r5, [sp], #16 ldrd r4, r5, [sp], #16
.cfi_restore 4 .cfi_restore 4
.cfi_restore 5 .cfi_restore 5
.cfi_adjust_cfa_offset -16
sub result, result, r1, lsr #24 sub result, result, r1, lsr #24
bx lr epilogue push_ip=HAVE_PAC_LEAF
#else #else
/* To use the big-endian trick we'd have to reverse all three words. /* To use the big-endian trick we'd have to reverse all three words.
that's slower than this approach. */ that's slower than this approach. */
@ -112,22 +115,21 @@
ldrd r4, r5, [sp], #16 ldrd r4, r5, [sp], #16
.cfi_restore 4 .cfi_restore 4
.cfi_restore 5 .cfi_restore 5
.cfi_adjust_cfa_offset -16
sub result, result, r1 sub result, result, r1
bx lr epilogue push_ip=HAVE_PAC_LEAF
#endif #endif
.endm .endm
.text .text
.p2align 5 .p2align 5
.Lstrcmp_start_addr:
#ifndef STRCMP_NO_PRECHECK
.Lfastpath_exit:
sub r0, r2, r3
bx lr
nop
#endif
def_fn strcmp def_fn strcmp
.fnstart
.cfi_sections .debug_frame
.cfi_startproc
prologue push_ip=HAVE_PAC_LEAF
#ifndef STRCMP_NO_PRECHECK #ifndef STRCMP_NO_PRECHECK
ldrb r2, [src1] ldrb r2, [src1]
ldrb r3, [src2] ldrb r3, [src2]
@ -136,16 +138,14 @@ def_fn strcmp
cmpcs r2, r3 cmpcs r2, r3
bne .Lfastpath_exit bne .Lfastpath_exit
#endif #endif
.cfi_sections .debug_frame
.cfi_startproc
strd r4, r5, [sp, #-16]! strd r4, r5, [sp, #-16]!
.cfi_def_cfa_offset 16 .cfi_adjust_cfa_offset 16
.cfi_offset 4, -16 .cfi_rel_offset 4, 0
.cfi_offset 5, -12 .cfi_rel_offset 5, 4
orr tmp1, src1, src2 orr tmp1, src1, src2
strd r6, r7, [sp, #8] strd r6, r7, [sp, #8]
.cfi_offset 6, -8 .cfi_rel_offset 6, 8
.cfi_offset 7, -4 .cfi_rel_offset 7, 12
mvn const_m1, #0 mvn const_m1, #0
lsl r2, tmp1, #29 lsl r2, tmp1, #29
cbz r2, .Lloop_aligned8 cbz r2, .Lloop_aligned8
@ -270,7 +270,6 @@ def_fn strcmp
ldr data1, [src1], #4 ldr data1, [src1], #4
beq .Laligned_m2 beq .Laligned_m2
bcs .Laligned_m1 bcs .Laligned_m1
#ifdef STRCMP_NO_PRECHECK #ifdef STRCMP_NO_PRECHECK
ldrb data2, [src2, #1] ldrb data2, [src2, #1]
uxtb tmp1, data1, ror #BYTE1_OFFSET uxtb tmp1, data1, ror #BYTE1_OFFSET
@ -314,10 +313,19 @@ def_fn strcmp
mov result, tmp1 mov result, tmp1
ldr r4, [sp], #16 ldr r4, [sp], #16
.cfi_restore 4 .cfi_restore 4
bx lr .cfi_adjust_cfa_offset -16
epilogue push_ip=HAVE_PAC_LEAF
#ifndef STRCMP_NO_PRECHECK #ifndef STRCMP_NO_PRECHECK
.Lfastpath_exit:
.cfi_restore_state
.cfi_remember_state
sub r0, r2, r3
epilogue push_ip=HAVE_PAC_LEAF
.Laligned_m1: .Laligned_m1:
.cfi_restore_state
.cfi_remember_state
add src2, src2, #4 add src2, src2, #4
#endif #endif
.Lsrc1_aligned: .Lsrc1_aligned:
@ -364,8 +372,9 @@ def_fn strcmp
/* R6/7 Not used in this sequence. */ /* R6/7 Not used in this sequence. */
.cfi_restore 6 .cfi_restore 6
.cfi_restore 7 .cfi_restore 7
.cfi_adjust_cfa_offset -16
neg result, result neg result, result
bx lr epilogue push_ip=HAVE_PAC_LEAF
6: 6:
.cfi_restore_state .cfi_restore_state
@ -441,7 +450,8 @@ def_fn strcmp
/* R6/7 not used in this sequence. */ /* R6/7 not used in this sequence. */
.cfi_restore 6 .cfi_restore 6
.cfi_restore 7 .cfi_restore 7
bx lr .cfi_adjust_cfa_offset -16
epilogue push_ip=HAVE_PAC_LEAF
.Lstrcmp_tail: .Lstrcmp_tail:
.cfi_restore_state .cfi_restore_state
@ -463,7 +473,10 @@ def_fn strcmp
/* R6/7 not used in this sequence. */ /* R6/7 not used in this sequence. */
.cfi_restore 6 .cfi_restore 6
.cfi_restore 7 .cfi_restore 7
.cfi_adjust_cfa_offset -16
sub result, result, data2, lsr #24 sub result, result, data2, lsr #24
bx lr epilogue push_ip=HAVE_PAC_LEAF
.cfi_endproc .cfi_endproc
.size strcmp, . - .Lstrcmp_start_addr .cantunwind
.fnend
.size strcmp, . - strcmp

View File

@ -29,6 +29,8 @@
/* Very similar to the generic code, but uses Thumb2 as implemented /* Very similar to the generic code, but uses Thumb2 as implemented
in ARMv7-M. */ in ARMv7-M. */
#include "arm_asm.h"
/* Parameters and result. */ /* Parameters and result. */
#define src1 r0 #define src1 r0
#define src2 r1 #define src2 r1
@ -44,8 +46,10 @@
.thumb .thumb
.syntax unified .syntax unified
def_fn strcmp def_fn strcmp
.fnstart
.cfi_sections .debug_frame .cfi_sections .debug_frame
.cfi_startproc .cfi_startproc
prologue push_ip=HAVE_PAC_LEAF
eor tmp1, src1, src2 eor tmp1, src1, src2
tst tmp1, #3 tst tmp1, #3
/* Strings not at same byte offset from a word boundary. */ /* Strings not at same byte offset from a word boundary. */
@ -82,6 +86,7 @@ def_fn strcmp
ldreq data2, [src2], #4 ldreq data2, [src2], #4
beq 4b beq 4b
2: 2:
.cfi_remember_state
/* There's a zero or a different byte in the word */ /* There's a zero or a different byte in the word */
S2HI result, data1, #24 S2HI result, data1, #24
S2LO data1, data1, #8 S2LO data1, data1, #8
@ -106,7 +111,7 @@ def_fn strcmp
lsrs result, result, #24 lsrs result, result, #24
subs result, result, data2 subs result, result, data2
#endif #endif
bx lr epilogue push_ip=HAVE_PAC_LEAF
#if 0 #if 0
@ -205,8 +210,10 @@ def_fn strcmp
/* First of all, compare bytes until src1(sp1) is word-aligned. */ /* First of all, compare bytes until src1(sp1) is word-aligned. */
.Lstrcmp_unaligned: .Lstrcmp_unaligned:
.cfi_restore_state
tst src1, #3 tst src1, #3
beq 2f beq 2f
.cfi_remember_state
ldrb data1, [src1], #1 ldrb data1, [src1], #1
ldrb data2, [src2], #1 ldrb data2, [src2], #1
cmp data1, #1 cmp data1, #1
@ -214,12 +221,13 @@ def_fn strcmp
cmpcs data1, data2 cmpcs data1, data2
beq .Lstrcmp_unaligned beq .Lstrcmp_unaligned
sub result, data1, data2 sub result, data1, data2
bx lr epilogue push_ip=HAVE_PAC_LEAF
2: 2:
.cfi_restore_state
stmfd sp!, {r5} stmfd sp!, {r5}
.cfi_def_cfa_offset 4 .cfi_adjust_cfa_offset 4
.cfi_offset 5, -4 .cfi_rel_offset 5, 0
ldr data1, [src1], #4 ldr data1, [src1], #4
and tmp2, src2, #3 and tmp2, src2, #3
@ -355,8 +363,8 @@ def_fn strcmp
.cfi_remember_state .cfi_remember_state
ldmfd sp!, {r5} ldmfd sp!, {r5}
.cfi_restore 5 .cfi_restore 5
.cfi_def_cfa_offset 0 .cfi_adjust_cfa_offset -4
bx lr epilogue push_ip=HAVE_PAC_LEAF
.Lstrcmp_tail: .Lstrcmp_tail:
.cfi_restore_state .cfi_restore_state
@ -372,7 +380,9 @@ def_fn strcmp
sub result, r2, result sub result, r2, result
ldmfd sp!, {r5} ldmfd sp!, {r5}
.cfi_restore 5 .cfi_restore 5
.cfi_def_cfa_offset 0 .cfi_adjust_cfa_offset -4
bx lr epilogue push_ip=HAVE_PAC_LEAF
.cfi_endproc .cfi_endproc
.cantunwind
.fnend
.size strcmp, . - strcmp .size strcmp, . - strcmp