
[RFA,PR,target/84128] Fix restore of scratch register used in probing loops

Message ID 328b4297-f032-6bf0-9252-1d7ee7b50133@redhat.com
State New
Series [RFA,PR,target/84128] Fix restore of scratch register used in probing loops

Commit Message

Jeff Law Jan. 31, 2018, 5:35 a.m. UTC
Whee, fun, this appears to have been broken for a very long time,
possibly since the introduction of -fstack-check in 2010.  Thankfully it
only affects 32-bit code and only in relatively constrained circumstances.

-fstack-check and -fstack-clash both potentially create a loop for stack
probing.  In that case they both need a scratch register to hold the
loop upper bound.

The code to allocate a scratch register first starts with the
caller-saved registers as they're zero cost.  Then it'll use any callee
saved register that is actually saved.  If neither is available (say
because all the caller-saved regs are used for parameter passing and
there are no callee saved registers used), then the allocation routine
will push %eax on the stack and the deallocation routine will pop it off
to restore its value.
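
For concreteness, here is the kind of function that lands in that
fallback: essentially the new test case included with this patch,
annotated (ia32, -O2 -fstack-clash-protection):

  /* regparm (3) hands the integer arguments over in the caller-saved
     registers, no callee-saved register ends up being saved, and the
     32k frame is large enough to require a probing loop, so the
     prologue has to push a scratch register and restore it later.  */
  __attribute__ ((noinline, noclone, regparm (3)))
  int
  f1 (long arg0, int (*pf) (long, void *))
  {
    unsigned char buf[32768];
    return pf (arg0, buf);
  }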

Of course there is a *stack allocation* between those two points.  So
the pop ends up restoring garbage into the register.

Obviously the restore routine needs to use reg+d addressing to get to
the stack slot and the allocated space needs to be deallocated by the
epilogue.  But sadly there are enough assertions sprinkled around to
prevent that from working as-is.

So what this patch does is continue to use the push to allocate the
register.  And it uses reg+d to restore the register after the probing
loops.  The "trick" is that the space allocated by the push becomes part
of the normal stack frame after we restore the scratch register's value.
I.e., if we push a 4-byte register, then we reduce the size of the main
allocation request by 4 bytes.  And everything just works.
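
To make the accounting concrete, here is a worked example with
hypothetical round numbers (a 32768-byte frame and 4-byte words; the
real sizes and offsets depend on the final frame layout):

  push of the scratch register   allocates     4 bytes
  probing loop + residual        allocates 32764 bytes   (SIZE reduced by 4)
  scratch register restore       movl 32764(%esp), %eax  (reg+d load, no pop)
  epilogue                       releases  32768 bytes, pushed word included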

Clearly this code had not been exercised.  So I hacked things up to
always generate a probing loop, always assume a scratch register needs
to be saved/restored, and enable stack clash protection by
default.  I bootstrapped that and compared testsuite runs against a run
which just had stack clash protection on by default.  That did turn up
an issue, but it was with my testing hacks, not with this patch :-)


I (of course) also did the usual bootstrap and regression tests, using
x86_64 and i686.  Hopefully this is the last iteration on the x86/x86_64
stack clash bits :-)

The one concern I have is do we need to tell the CFI machinery that
%eax's value was restored to its entry value?

OK for the trunk?  Or do we need some magic CFI bit to describe the
restore of %eax?

Thanks,
Jeff
PR target/84128
	* config/i386/i386.c (release_scratch_register_on_entry): Add new
	OFFSET argument.  Use it to restore the scratch register rather
	than a pop insn.
	(ix86_adjust_stack_and_probe_stack_clash): Un-constify SIZE.
	If we have to save a temporary register, decrement SIZE appropriately.
	Pass SIZE to release_scratch_register_on_entry as the offset to
	the saved register.
	(ix86_adjust_stack_and_probe): Likewise.
	(ix86_emit_probe_stack_range): Likewise.


	PR target/84128
	* gcc.target/i386/pr84128.c: New test.

Comments

Eric Botcazou Jan. 31, 2018, 8:28 a.m. UTC | #1
> -fstack-check and -fstack-clash both potentially create a loop for stack
> probing.  In that case they both need a scratch register to hold the
> loop upper bound.
> 
> The code to allocate a scratch register first starts with the
> caller-saved registers as they're zero cost.  Then it'll use any callee
> saved register that is actually saved.  If neither is available (say
> because all the caller-saved regs are used for parameter passing and
> there are no callee saved registers used), then the allocation routine
> will push %eax on the stack and the deallocation routine will pop it off
> to restore its value.
> 
> Of course there is a *stack allocation* between those two points.  So
> the pop ends up restoring garbage into the register.

There is a stack allocation only on Linux; there isn't any on Solaris, *BSD,
Windows, LynxOS and other OSes where you can probe below the stack pointer.

> Clearly this code had not been exercised.  So I hacked things up to
> always generate a probing loop, always assume a scratch register needs
> to be saved/restored, and enable stack clash protection by
> default. 

Probably not on Linux indeed.  But, since you modified the non-Linux path, you 
need to avoid repeating the same mistake and test on non-Linux native too.
Uros Bizjak Jan. 31, 2018, 10:41 a.m. UTC | #2
On Wed, Jan 31, 2018 at 6:35 AM, Jeff Law <law@redhat.com> wrote:
> Whee, fun, this appears to have been broken for a very long time,
> possibly since the introduction of -fstack-check in 2010.  Thankfully it
> only affects 32-bit code and only in relatively constrained circumstances.
>
> -fstack-check and -fstack-clash both potentially create a loop for stack
> probing.  In that case they both need a scratch register to hold the
> loop upper bound.
>
> The code to allocate a scratch register first starts with the
> caller-saved registers as they're zero cost.  Then it'll use any callee
> saved register that is actually saved.  If neither is available (say
> because all the caller-saved regs are used for parameter passing and
> there are no callee saved registers used), then the allocation routine
> will push %eax on the stack and the deallocation routine will pop it off
> to restore its value.
>
> Of course there is a *stack allocation* between those two points.  So
> the pop ends up restoring garbage into the register.
>
> Obviously the restore routine needs to use reg+d addressing to get to
> the stack slot and the allocated space needs to be deallocated by the
> epilogue.  But sadly there are enough assertions sprinkled around to
> prevent that from working as-is.
>
> So what this patch does is continue to use the push to allocate the
> register.  And it uses reg+d to restore the register after the probing
> loops.  The "trick" is that the space allocated by the push becomes part
> of the normal stack frame after we restore the scratch register's value.
> I.e., if we push a 4-byte register, then we reduce the size of the main
> allocation request by 4 bytes.  And everything just works.
>
> Clearly this code had not been exercised.  So I hacked things up to
> always generate a probing loop, always assume a scratch register needs
> to be saved/restored, and enable stack clash protection by
> default.  I bootstrapped that and compared testsuite runs against a run
> which just had stack clash protection on by default.  That did turn up
> an issue, but it was with my testing hacks, not with this patch :-)
>
>
> I (of course) also did the usual bootstrap and regression tests, using
> x86_64 and i686.  Hopefully this is the last iteration on the x86/x86_64
> stack clash bits :-)
>
> The one concern I have is do we need to tell the CFI machinery that
> %eax's value was restored to its entry value?

Can you or someone who knows the CFI stuff please investigate this a
bit?  I'm not an expert in this area, and I don't feel comfortable
approving a patch that has some known loose ends in an area I don't
know that well.

Uros.
Jeff Law Jan. 31, 2018, 3:48 p.m. UTC | #3
On 01/31/2018 01:28 AM, Eric Botcazou wrote:
>> -fstack-check and -fstack-clash both potentially create a loop for stack
>> probing.  In that case they both need a scratch register to hold the
>> loop upper bound.
>>
>> The code to allocate a scratch register first starts with the
>> caller-saved registers as they're zero cost.  Then it'll use any callee
>> saved register that is actually saved.  If neither is available (say
>> because all the caller-saved regs are used for parameter passing and
>> there are no callee saved registers used), then the allocation routine
>> will push %eax on the stack and the deallocation routine will pop it off
>> to restore its value.
>>
>> Of course there is a *stack allocation* between those two points.  So
>> the pop ends up restoring garbage into the register.
> 
> There is a stack allocation only on Linux; there isn't any on Solaris, *BSD,
> Windows, LynxOS and other OSes where you can probe below the stack pointer.
Ack.  Let's hold the patch until I can test *that* path.

jeff
Jeff Law Jan. 31, 2018, 10:55 p.m. UTC | #4
On 01/31/2018 01:28 AM, Eric Botcazou wrote:
>> -fstack-check and -fstack-clash both potentially create a loop for stack
>> probing.  In that case they both need a scratch register to hold the
>> loop upper bound.
>>
>> The code to allocate a scratch register first starts with the
>> caller-saved registers as they're zero cost.  Then it'll use any callee
>> saved register that is actually saved.  If neither is available (say
>> because all the caller-saved regs are used for parameter passing and
>> there are no callee saved registers used), then the allocation routine
>> will push %eax on the stack and the deallocation routine will pop it off
>> to restore its value.
>>
>> Of course there is a *stack allocation* between those two points.  So
>> the pop ends up restoring garbage into the register.
> 
> There is a stack allocation only on Linux; there isn't any on Solaris, *BSD,
> Windows, LynxOS and other OSes where you can probe below the stack pointer.
So I went back and restored the code for targets that don't define
STACK_CHECK_MOVING_SP (everything but Linux, I believe).

To test it, I turned on stack checking by default and bootstrapped that
as a baseline.

Then I turned off STACK_CHECK_MOVING_SP and compared that to the
baseline.  Not surprisingly, things with large stacks failed during
probing.  I then hacked up the dejagnu bits to present just an 8k
stack, which made all the regressions that had stack usage dg markers
turn into
UNRESOLVED.  There were still many tests that had to be checked manually
because they didn't have stack usage dg markup.  This is baseline #2.

I then forced all prologue allocations to go through the loop code,
bootstrapped that and compared it to baseline #2.

Then I turned off STACK_CHECK_MOVING_SP and forced all prologue
allocations to go through the loop code.  Bootstrapped that and compared
the results to the baseline to ensure we weren't regressing.

Note some tests want to verify we don't have push/pops in their
resulting assembly code or count the number of orl instructions.  Those
had to be hand-checked along the way as well.  Par for the course.

I'm confident I've got all 3 paths covered reasonably well now.  I still
need to check into the CFI concern before resubmitting.

jeff

P.S.  I also did light testing before restoring the code to handle
!STACK_CHECK_MOVING_SP, to verify that it was indeed wrong with my
original patch.
Jeff Law Feb. 1, 2018, 1:19 a.m. UTC | #5
On 01/31/2018 03:41 AM, Uros Bizjak wrote:
>>
>> The one concern I have is do we need to tell the CFI machinery that
>> %eax's value was restored to its entry value?
> 
> Can you or someone that knows CFI stuff please investigate this a bit?
> I'm not expert in this area, and I don't feel comfortable to approve
> the patch that has some known loose edges in the area I don't know
> that well.
Fair enough.  I'm not terribly familiar with the CFI bits either, but I
was able to work this out.

I've looked at gcc-6, gcc-7 and the trunk.  None of them record
anything WRT %eax at the restore point.  If the CFA is the stack
pointer, they record that the CFA offset changed, but nothing about
%eax.

So this patch doesn't change the accuracy of the CFI info.  One
might be able to argue that we should record the restores, but that
seems like an independent issue to me.

I'll post an updated patch momentarily.

jeff

Patch

diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c
index fef34a1..93ce79c 100644
--- a/gcc/config/i386/i386.c
+++ b/gcc/config/i386/i386.c
@@ -12567,22 +12567,25 @@  get_scratch_register_on_entry (struct scratch_reg *sr)
     }
 }
 
-/* Release a scratch register obtained from the preceding function.  */
+/* Release a scratch register obtained from the preceding function.
+
+   Note there will always be some kind of stack adjustment between
+   allocation and releasing the scratch register.  So we can't just
+   pop the scratch register off the stack if we were forced to save it
+   (the stack pointer itself has a different value).
+
+   Instead we're passed the offset into the stack where the value will
+   be found and the space becomes part of the local frame that is
+   deallocated by the epilogue.  */
 
 static void
-release_scratch_register_on_entry (struct scratch_reg *sr)
+release_scratch_register_on_entry (struct scratch_reg *sr, HOST_WIDE_INT offset)
 {
   if (sr->saved)
     {
-      struct machine_function *m = cfun->machine;
-      rtx x, insn = emit_insn (gen_pop (sr->reg));
-
-      /* The RTX_FRAME_RELATED_P mechanism doesn't know about pop.  */
-      RTX_FRAME_RELATED_P (insn) = 1;
-      x = gen_rtx_PLUS (Pmode, stack_pointer_rtx, GEN_INT (UNITS_PER_WORD));
-      x = gen_rtx_SET (stack_pointer_rtx, x);
-      add_reg_note (insn, REG_FRAME_RELATED_EXPR, x);
-      m->fs.sp_offset -= UNITS_PER_WORD;
+      rtx x = gen_rtx_PLUS (Pmode, stack_pointer_rtx, GEN_INT (offset));
+      x = gen_rtx_SET (sr->reg, gen_rtx_MEM (word_mode, x));
+      emit_insn (x);
     }
 }
 
@@ -12597,7 +12600,7 @@  release_scratch_register_on_entry (struct scratch_reg *sr)
    pushed on the stack.  */
 
 static void
-ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
+ix86_adjust_stack_and_probe_stack_clash (HOST_WIDE_INT size,
 					 const bool int_registers_saved)
 {
   struct machine_function *m = cfun->machine;
@@ -12713,6 +12716,12 @@  ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
       struct scratch_reg sr;
       get_scratch_register_on_entry (&sr);
 
+      /* If we needed to save a register, then account for any space
+	 that was pushed (we are not going to pop the register when
+	 we do the restore).  */
+      if (sr.saved)
+	size -= UNITS_PER_WORD;
+
       /* Step 1: round SIZE down to a multiple of the interval.  */
       HOST_WIDE_INT rounded_size = size & -probe_interval;
 
@@ -12761,7 +12770,9 @@  ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
 				   m->fs.cfa_reg == stack_pointer_rtx);
       dump_stack_clash_frame_info (PROBE_LOOP, size != rounded_size);
 
-      release_scratch_register_on_entry (&sr);
+      /* This does not deallocate the space reserved for the scratch
+	 register.  That will be deallocated in the epilogue.  */
+      release_scratch_register_on_entry (&sr, size);
     }
 
   /* Make sure nothing is scheduled before we are done.  */
@@ -12774,7 +12785,7 @@  ix86_adjust_stack_and_probe_stack_clash (const HOST_WIDE_INT size,
    pushed on the stack.  */
 
 static void
-ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
+ix86_adjust_stack_and_probe (HOST_WIDE_INT size,
 			     const bool int_registers_saved)
 {
   /* We skip the probe for the first interval + a small dope of 4 words and
@@ -12847,6 +12858,11 @@  ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
 
       get_scratch_register_on_entry (&sr);
 
+      /* If we needed to save a register, then account for any space
+	 that was pushed (we are not going to pop the register when
+	 we do the restore).  */
+      if (sr.saved)
+	size -= UNITS_PER_WORD;
 
       /* Step 1: round SIZE to the previous multiple of the interval.  */
 
@@ -12906,7 +12922,9 @@  ix86_adjust_stack_and_probe (const HOST_WIDE_INT size,
 						    (get_probe_interval ()
 						     + dope))));
 
-      release_scratch_register_on_entry (&sr);
+      /* This does not deallocate the space reserved for the scratch
+	 register.  That will be deallocated in the epilogue.  */
+      release_scratch_register_on_entry (&sr, size);
     }
 
   /* Even if the stack pointer isn't the CFA register, we need to correctly
@@ -13015,6 +13033,11 @@  ix86_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size,
 
       get_scratch_register_on_entry (&sr);
 
+      /* If we needed to save a register, then account for any space
+	 that was pushed (we are not going to pop the register when
+	 we do the restore).  */
+      if (sr.saved)
+	size -= UNITS_PER_WORD;
 
       /* Step 1: round SIZE to the previous multiple of the interval.  */
 
@@ -13055,7 +13078,9 @@  ix86_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size,
 						       sr.reg),
 					 rounded_size - size));
 
-      release_scratch_register_on_entry (&sr);
+      /* This does not deallocate the space reserved for the scratch
+	 register.  That will be deallocated in the epilogue.  */
+      release_scratch_register_on_entry (&sr, size);
     }
 
   /* Make sure nothing is scheduled before we are done.  */
diff --git a/gcc/testsuite/gcc.target/i386/pr84128.c b/gcc/testsuite/gcc.target/i386/pr84128.c
new file mode 100644
index 0000000..a8323fd6
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr84128.c
@@ -0,0 +1,30 @@ 
+/* { dg-do run } */
+/* { dg-options "-O2 -march=i686 -mtune=generic -fstack-clash-protection" } */
+/* { dg-require-effective-target ia32 } */
+
+__attribute__ ((noinline, noclone, weak, regparm (3)))
+int
+f1 (long arg0, int (*pf) (long, void *))
+{
+  unsigned char buf[32768];
+  return pf (arg0, buf);
+}
+
+__attribute__ ((noinline, noclone, weak))
+int
+f2 (long arg0, void *ignored)
+{
+  if (arg0 != 17)
+    __builtin_abort ();
+  return 19;
+}
+
+int
+main (void)
+{
+  if (f1 (17, f2) != 19)
+    __builtin_abort ();
+  return 0;
+}
+
+