From 016b3002e13acefb5773da78659c050187d3a96f Mon Sep 17 00:00:00 2001 From: Uros Bizjak Date: Thu, 9 Nov 2023 19:47:57 +0100 Subject: [PATCH] i386: Improve stack protector patterns and peephole2s even more Improve stack protector patterns and peephole2s even more: a. Use unrelated register clears with integer mode size <= word mode size to clear stack protector scratch register. b. Use unrelated register initializations in front of stack protector sequence to clear stack protector scratch register. c. Use unrelated register initializations using LEA instructions to clear stack protector scratch register. These stack protector improvements reuse 6914 unrelated register initializations to substitute the clear of stack protector scratch register in 12034 instances of stack protector sequence in recent linux defconfig build. gcc/ChangeLog: * config/i386/i386.md (@stack_protect_set_1__): Use W mode iterator instead of SWI48. Output MOV instead of XOR for TARGET_USE_MOV0. (stack_protect_set_1 peephole2): Use integer modes with mode size <= word mode size for operand 3. (stack_protect_set_1 peephole2 #2): New peephole2 pattern to substitute stack protector scratch register clear with unrelated register initialization, originally in front of stack protector sequence. (*stack_protect_set_3__): New insn pattern. (stack_protect_set_1 peephole2): New peephole2 pattern to substitute stack protector scratch register clear with unrelated register initialization involving LEA instruction. --- gcc/config/i386/i386.md | 75 ++++++++++++++++++++++++++++++++++++----- 1 file changed, 66 insertions(+), 9 deletions(-) diff --git a/gcc/config/i386/i386.md b/gcc/config/i386/i386.md index ce7102af44fb5..046b6b7919e9f 100644 --- a/gcc/config/i386/i386.md +++ b/gcc/config/i386/i386.md @@ -6172,7 +6172,7 @@ gcc_assert (TARGET_64BIT); return "lea{l}\t{%E1, %k0|%k0, %E1}"; } - else + else return "lea{}\t{%E1, %0|%0, %E1}"; } [(set_attr "type" "lea") @@ -24306,11 +24306,11 @@ DONE; }) -(define_insn "@stack_protect_set_1__" +(define_insn "@stack_protect_set_1__" [(set (match_operand:PTR 0 "memory_operand" "=m") (unspec:PTR [(match_operand:PTR 1 "memory_operand" "m")] UNSPEC_SP_SET)) - (set (match_operand:SWI48 2 "register_operand" "=&r") (const_int 0)) + (set (match_operand:W 2 "register_operand" "=&r") (const_int 0)) (clobber (reg:CC FLAGS_REG))] "" { @@ -24318,7 +24318,10 @@ operands); output_asm_insn ("mov{}\t{%2, %0|%0, %2}", operands); - return "xor{l}\t%k2, %k2"; + if (!TARGET_USE_MOV0 || optimize_insn_for_size_p ()) + return "xor{l}\t%k2, %k2"; + else + return "mov{l}\t{$0, %k2|%k2, 0}"; } [(set_attr "type" "multi")]) @@ -24334,15 +24337,16 @@ UNSPEC_SP_SET)) (set (match_operand:W 2 "general_reg_operand") (const_int 0)) (clobber (reg:CC FLAGS_REG))]) - (parallel [(set (match_operand:SWI48 3 "general_reg_operand") - (match_operand:SWI48 4 "const0_operand")) - (clobber (reg:CC FLAGS_REG))])] - "peep2_reg_dead_p (0, operands[3]) + (set (match_operand 3 "general_reg_operand") + (match_operand 4 "const0_operand"))] + "GET_MODE_SIZE (GET_MODE (operands[3])) <= UNITS_PER_WORD + && peep2_reg_dead_p (0, operands[3]) && peep2_reg_dead_p (1, operands[2])" [(parallel [(set (match_dup 0) (unspec:PTR [(match_dup 1)] UNSPEC_SP_SET)) (set (match_dup 3) (const_int 0)) - (clobber (reg:CC FLAGS_REG))])]) + (clobber (reg:CC FLAGS_REG))])] + "operands[3] = gen_lowpart (word_mode, operands[3]);") (define_insn "*stack_protect_set_2__si" [(set (match_operand:PTR 0 "memory_operand" "=m") @@ -24401,6 +24405,59 @@ (unspec:PTR [(match_dup 1)] UNSPEC_SP_SET)) (set (match_dup 3) (match_dup 4))])]) +(define_peephole2 + [(set (match_operand:SWI48 3 "general_reg_operand") + (match_operand:SWI48 4 "general_gr_operand")) + (parallel [(set (match_operand:PTR 0 "memory_operand") + (unspec:PTR [(match_operand:PTR 1 "memory_operand")] + UNSPEC_SP_SET)) + (set (match_operand:W 2 "general_reg_operand") (const_int 0)) + (clobber (reg:CC FLAGS_REG))])] + "peep2_reg_dead_p (0, operands[3]) + && peep2_reg_dead_p (2, operands[2]) + && !reg_mentioned_p (operands[3], operands[0]) + && !reg_mentioned_p (operands[3], operands[1])" + [(parallel [(set (match_dup 0) + (unspec:PTR [(match_dup 1)] UNSPEC_SP_SET)) + (set (match_dup 3) (match_dup 4))])]) + +(define_insn "*stack_protect_set_3__" + [(set (match_operand:PTR 0 "memory_operand" "=m") + (unspec:PTR [(match_operand:PTR 3 "memory_operand" "m")] + UNSPEC_SP_SET)) + (set (match_operand:SWI48 1 "register_operand" "=&r") + (match_operand:SWI48 2 "address_no_seg_operand" "Ts"))] + "" +{ + output_asm_insn ("mov{}\t{%3, %1|%1, %3}", + operands); + output_asm_insn ("mov{}\t{%1, %0|%0, %1}", + operands); + if (SImode_address_operand (operands[2], VOIDmode)) + { + gcc_assert (TARGET_64BIT); + return "lea{l}\t{%E2, %k1|%k1, %E2}"; + } + else + return "lea{}\t{%E2, %1|%1, %E2}"; +} + [(set_attr "type" "multi") + (set_attr "length" "24")]) + +(define_peephole2 + [(parallel [(set (match_operand:PTR 0 "memory_operand") + (unspec:PTR [(match_operand:PTR 1 "memory_operand")] + UNSPEC_SP_SET)) + (set (match_operand:W 2 "general_reg_operand") (const_int 0)) + (clobber (reg:CC FLAGS_REG))]) + (set (match_operand:SWI48 3 "general_reg_operand") + (match_operand:SWI48 4 "address_no_seg_operand"))] + "peep2_reg_dead_p (0, operands[3]) + && peep2_reg_dead_p (1, operands[2])" + [(parallel [(set (match_dup 0) + (unspec:PTR [(match_dup 1)] UNSPEC_SP_SET)) + (set (match_dup 3) (match_dup 4))])]) + (define_expand "stack_protect_test" [(match_operand 0 "memory_operand") (match_operand 1 "memory_operand")