diff mbox

[rs6000] Fix PR16458, eliminate redudant compares

Message ID 1327683378.14063.28.camel@otta
State New
Headers show

Commit Message

Peter Bergner Jan. 27, 2012, 4:56 p.m. UTC
This patch fixes PR16458 by using the type expression attached to a reg
rtx to detect its signedness and generating unsigned compares when
appropriate.  However, we continue to use signed compares for the
special case of when we compare an unsigned reg against the constant 0.
This is because signed and unsigned compares give the same results
for equality and "(unsigned)x > 0)" is equivalent to "x != 0".
Using a signed compare in this special case allows us to continue to
generate record form instructions (ie, instructions that implicitly
set cr0).

I'll note that for the moment, I have XFAILed pr16458-4.c, since this
test case isn't working yet, but it is due to a problem in expand not
attaching any type expression information on *index's reg rtx like it
does for *a and *b in pr16458-2.c.  We're tracking that down for 4.8.

This has passed bootstrap and regtesting with no regressions.
Ok for mainline?

Peter

gcc/
	PR target/16458
	* config/rs6000/rs6000.c (rs6000_unsigned_reg_p): New function.
	(rs6000_generate_compare): Use it.

gcc/testsuite/
	PR target/16458
	* gcc.target/powerpc/pr16458-1.c: New test.
	* gcc.target/powerpc/pr16458-2.c: Likewise.
	* gcc.target/powerpc/pr16458-3.c: Likewise.
	* gcc.target/powerpc/pr16458-4.c: Likewise.

Comments

Richard Biener Jan. 30, 2012, 9:46 a.m. UTC | #1
On Fri, Jan 27, 2012 at 5:56 PM, Peter Bergner <bergner@vnet.ibm.com> wrote:
> This patch fixes PR16458 by using the type expression attached to a reg
> rtx to detect its signedness and generating unsigned compares when
> appropriate.  However, we continue to use signed compares for the
> special case of when we compare an unsigned reg against the constant 0.
> This is because signed and unsigned compares give the same results
> for equality and "(unsigned)x > 0)" is equivalent to "x != 0".
> Using a signed compare in this special case allows us to continue to
> generate record form instructions (ie, instructions that implicitly
> set cr0).
>
> I'll note that for the moment, I have XFAILed pr16458-4.c, since this
> test case isn't working yet, but it is due to a problem in expand not
> attaching any type expression information on *index's reg rtx like it
> does for *a and *b in pr16458-2.c.  We're tracking that down for 4.8.
>
> This has passed bootstrap and regtesting with no regressions.
> Ok for mainline?

This does not sound suitable for stage4.  rs6000_unsigned_reg_p
looks suspiciously non-rs6000 specific, and if we really can rely
on the way it is implemented should find its way to general RTL
helper routines.  The question is - do we ever coalesce signed
and unsigned variables to the same pseudo?

IIRC avr people recently have come across the same idea.

Richard.

> Peter
>
> gcc/
>        PR target/16458
>        * config/rs6000/rs6000.c (rs6000_unsigned_reg_p): New function.
>        (rs6000_generate_compare): Use it.
>
> gcc/testsuite/
>        PR target/16458
>        * gcc.target/powerpc/pr16458-1.c: New test.
>        * gcc.target/powerpc/pr16458-2.c: Likewise.
>        * gcc.target/powerpc/pr16458-3.c: Likewise.
>        * gcc.target/powerpc/pr16458-4.c: Likewise.
>
> Index: gcc/config/rs6000/rs6000.c
> ===================================================================
> --- gcc/config/rs6000/rs6000.c  (revision 183628)
> +++ gcc/config/rs6000/rs6000.c  (working copy)
> @@ -15588,6 +15588,22 @@ rs6000_reverse_condition (enum machine_m
>     return reverse_condition (code);
>  }
>
> +static bool
> +rs6000_unsigned_reg_p (rtx op)
> +{
> +  enum rtx_code code = GET_CODE (op);
> +
> +  if (code == REG
> +      && REG_EXPR (op)
> +      && TYPE_UNSIGNED (TREE_TYPE (REG_EXPR (op))))
> +    return true;
> +
> +  if (code == SUBREG && SUBREG_PROMOTED_UNSIGNED_P (op))
> +    return true;
> +
> +  return false;
> +}
> +
>  /* Generate a compare for CODE.  Return a brand-new rtx that
>    represents the result of the compare.  */
>
> @@ -15606,14 +15622,11 @@ rs6000_generate_compare (rtx cmp, enum m
>           || code == GEU || code == LEU)
>     comp_mode = CCUNSmode;
>   else if ((code == EQ || code == NE)
> -          && GET_CODE (op0) == SUBREG
> -          && GET_CODE (op1) == SUBREG
> -          && SUBREG_PROMOTED_UNSIGNED_P (op0)
> -          && SUBREG_PROMOTED_UNSIGNED_P (op1))
> +          && rs6000_unsigned_reg_p (op0)
> +          && (rs6000_unsigned_reg_p (op1)
> +              || (CONST_INT_P (op1) && INTVAL (op1) != 0)))
>     /* These are unsigned values, perhaps there will be a later
> -       ordering compare that can be shared with this one.
> -       Unfortunately we cannot detect the signedness of the operands
> -       for non-subregs.  */
> +       ordering compare that can be shared with this one.  */
>     comp_mode = CCUNSmode;
>   else
>     comp_mode = CCmode;
> Index: gcc/testsuite/gcc.target/powerpc/pr16458-1.c
> ===================================================================
> --- gcc/testsuite/gcc.target/powerpc/pr16458-1.c        (revision 0)
> +++ gcc/testsuite/gcc.target/powerpc/pr16458-1.c        (revision 0)
> @@ -0,0 +1,18 @@
> +/* Test cse'ing of unsigned compares.  */
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +
> +/* { dg-final { scan-assembler-not "cmpw" } } */
> +/* { dg-final { scan-assembler-times "cmplw" 1 } } */
> +
> +unsigned int a, b;
> +
> +int
> +foo (void)
> +{
> +  if (a == b) return 1;
> +  if (a > b)  return 2;
> +  if (a < b)  return 3;
> +  if (a != b) return 4;
> +  return 0;
> +}
> Index: gcc/testsuite/gcc.target/powerpc/pr16458-2.c
> ===================================================================
> --- gcc/testsuite/gcc.target/powerpc/pr16458-2.c        (revision 0)
> +++ gcc/testsuite/gcc.target/powerpc/pr16458-2.c        (revision 0)
> @@ -0,0 +1,18 @@
> +/* Test cse'ing of unsigned compares.  */
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +
> +/* { dg-final { scan-assembler-not "cmpw" } } */
> +/* { dg-final { scan-assembler-times "cmplw" 1 } } */
> +
> +unsigned int *a, *b;
> +
> +int
> +foo (void)
> +{
> +  if (*a == *b) return 1;
> +  if (*a > *b)  return 2;
> +  if (*a < *b)  return 3;
> +  if (*a != *b) return 4;
> +  return 0;
> +}
> Index: gcc/testsuite/gcc.target/powerpc/pr16458-3.c
> ===================================================================
> --- gcc/testsuite/gcc.target/powerpc/pr16458-3.c        (revision 0)
> +++ gcc/testsuite/gcc.target/powerpc/pr16458-3.c        (revision 0)
> @@ -0,0 +1,41 @@
> +/* Test cse'ing of unsigned compares.  */
> +/* { dg-do compile } */
> +/* { dg-options "-O2 -fno-jump-tables" } */
> +
> +/* { dg-final { scan-assembler-not "cmpwi" } } */
> +/* { dg-final { scan-assembler-times "cmplwi" 5 } } */
> +
> +extern int case0 (void);
> +extern int case1 (void);
> +extern int case2 (void);
> +extern int case3 (void);
> +extern int case4 (void);
> +
> +enum CASE_VALUES
> +{
> +  CASE0 = 0,
> +  CASE1,
> +  CASE2,
> +  CASE3,
> +  CASE4
> +};
> +
> +int
> +foo (enum CASE_VALUES index)
> +{
> +  switch (index)
> +    {
> +    case CASE0:
> +      return case0 ();
> +    case CASE1:
> +      return case1 ();
> +    case CASE2:
> +      return case2 ();
> +    case CASE3:
> +      return case3 ();
> +    case CASE4:
> +      return case4 ();
> +    }
> +
> +  return 0;
> +}
> Index: gcc/testsuite/gcc.target/powerpc/pr16458-4.c
> ===================================================================
> --- gcc/testsuite/gcc.target/powerpc/pr16458-4.c        (revision 0)
> +++ gcc/testsuite/gcc.target/powerpc/pr16458-4.c        (revision 0)
> @@ -0,0 +1,44 @@
> +/* Test cse'ing of unsigned compares.  */
> +/* { dg-do compile } */
> +/* { dg-options "-O2 -fno-jump-tables" } */
> +
> +/* The following tests fail due to an issue in expand not
> +   attaching an type expression information on *index's reg rtx.  */
> +
> +/* { dg-final { scan-assembler-not "cmpwi" { xfail *-*-* } } } */
> +/* { dg-final { scan-assembler-times "cmplwi" 5 { xfail *-*-* } } } */
> +
> +extern int case0 (void);
> +extern int case1 (void);
> +extern int case2 (void);
> +extern int case3 (void);
> +extern int case4 (void);
> +
> +enum CASE_VALUES
> +{
> +  CASE0 = 0,
> +  CASE1,
> +  CASE2,
> +  CASE3,
> +  CASE4
> +};
> +
> +int
> +foo (enum CASE_VALUES *index)
> +{
> +  switch (*index)
> +    {
> +    case CASE0:
> +      return case0 ();
> +    case CASE1:
> +      return case1 ();
> +    case CASE2:
> +      return case2 ();
> +    case CASE3:
> +      return case3 ();
> +    case CASE4:
> +      return case4 ();
> +    }
> +
> +  return 0;
> +}
>
>
Peter Bergner Jan. 31, 2012, 2:55 p.m. UTC | #2
On Mon, 2012-01-30 at 10:46 +0100, Richard Guenther wrote:
> On Fri, Jan 27, 2012 at 5:56 PM, Peter Bergner <bergner@vnet.ibm.com> wrote:
> > This patch fixes PR16458 by using the type expression attached to a reg
> > rtx to detect its signedness and generating unsigned compares when
> > appropriate.  However, we continue to use signed compares for the
> > special case of when we compare an unsigned reg against the constant 0.
> > This is because signed and unsigned compares give the same results
> > for equality and "(unsigned)x > 0)" is equivalent to "x != 0".
> > Using a signed compare in this special case allows us to continue to
> > generate record form instructions (ie, instructions that implicitly
> > set cr0).


> > I'll note that for the moment, I have XFAILed pr16458-4.c, since this
> > test case isn't working yet, but it is due to a problem in expand not
> > attaching any type expression information on *index's reg rtx like it
> > does for *a and *b in pr16458-2.c.  We're tracking that down for 4.8.

I asked Bill to have a look at this one and he emailed the gcc mailing
list regarding the issue.  It looks like micha has a working answer:

  http://gcc.gnu.org/ml/gcc/2012-01/msg00349.html



> > This has passed bootstrap and regtesting with no regressions.
> > Ok for mainline?
> 
> This does not sound suitable for stage4.  

Since this has been around for a while, I'm fine with waiting until
stage1.


> rs6000_unsigned_reg_p
> looks suspiciously non-rs6000 specific, and if we really can rely
> on the way it is implemented should find its way to general RTL
> helper routines.

If other ports like avr can make use of it too, I have no problems
moving it somewhere else.


> The question is - do we ever coalesce signed
> and unsigned variables to the same pseudo?

What is it you are worried about?  The patch is only attempting
to emit unsigned compares for operands we know to be unsigned.
The fact that the compares are equality compares means we can
use either signed or unsigned compares.  It's just that the signed
versions don't CSE with any following non-equality unsigned compares
with the same unsigned operands.


> IIRC avr people recently have come across the same idea.

Do you have a pointer for this?


Peter
diff mbox

Patch

Index: gcc/config/rs6000/rs6000.c
===================================================================
--- gcc/config/rs6000/rs6000.c	(revision 183628)
+++ gcc/config/rs6000/rs6000.c	(working copy)
@@ -15588,6 +15588,22 @@  rs6000_reverse_condition (enum machine_m
     return reverse_condition (code);
 }
 
+static bool
+rs6000_unsigned_reg_p (rtx op)
+{
+  enum rtx_code code = GET_CODE (op);
+
+  if (code == REG
+      && REG_EXPR (op)
+      && TYPE_UNSIGNED (TREE_TYPE (REG_EXPR (op))))
+    return true;
+
+  if (code == SUBREG && SUBREG_PROMOTED_UNSIGNED_P (op))
+    return true;
+
+  return false;
+}
+
 /* Generate a compare for CODE.  Return a brand-new rtx that
    represents the result of the compare.  */
 
@@ -15606,14 +15622,11 @@  rs6000_generate_compare (rtx cmp, enum m
 	   || code == GEU || code == LEU)
     comp_mode = CCUNSmode;
   else if ((code == EQ || code == NE)
-	   && GET_CODE (op0) == SUBREG
-	   && GET_CODE (op1) == SUBREG
-	   && SUBREG_PROMOTED_UNSIGNED_P (op0)
-	   && SUBREG_PROMOTED_UNSIGNED_P (op1))
+	   && rs6000_unsigned_reg_p (op0)
+	   && (rs6000_unsigned_reg_p (op1)
+	       || (CONST_INT_P (op1) && INTVAL (op1) != 0)))
     /* These are unsigned values, perhaps there will be a later
-       ordering compare that can be shared with this one.
-       Unfortunately we cannot detect the signedness of the operands
-       for non-subregs.  */
+       ordering compare that can be shared with this one.  */
     comp_mode = CCUNSmode;
   else
     comp_mode = CCmode;
Index: gcc/testsuite/gcc.target/powerpc/pr16458-1.c
===================================================================
--- gcc/testsuite/gcc.target/powerpc/pr16458-1.c	(revision 0)
+++ gcc/testsuite/gcc.target/powerpc/pr16458-1.c	(revision 0)
@@ -0,0 +1,18 @@ 
+/* Test cse'ing of unsigned compares.  */
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+/* { dg-final { scan-assembler-not "cmpw" } } */
+/* { dg-final { scan-assembler-times "cmplw" 1 } } */
+
+unsigned int a, b;
+
+int
+foo (void)
+{
+  if (a == b) return 1;
+  if (a > b)  return 2;
+  if (a < b)  return 3;
+  if (a != b) return 4;
+  return 0;
+}
Index: gcc/testsuite/gcc.target/powerpc/pr16458-2.c
===================================================================
--- gcc/testsuite/gcc.target/powerpc/pr16458-2.c	(revision 0)
+++ gcc/testsuite/gcc.target/powerpc/pr16458-2.c	(revision 0)
@@ -0,0 +1,18 @@ 
+/* Test cse'ing of unsigned compares.  */
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+/* { dg-final { scan-assembler-not "cmpw" } } */
+/* { dg-final { scan-assembler-times "cmplw" 1 } } */
+
+unsigned int *a, *b;
+
+int
+foo (void)
+{
+  if (*a == *b) return 1;
+  if (*a > *b)  return 2;
+  if (*a < *b)  return 3;
+  if (*a != *b) return 4;
+  return 0;
+}
Index: gcc/testsuite/gcc.target/powerpc/pr16458-3.c
===================================================================
--- gcc/testsuite/gcc.target/powerpc/pr16458-3.c	(revision 0)
+++ gcc/testsuite/gcc.target/powerpc/pr16458-3.c	(revision 0)
@@ -0,0 +1,41 @@ 
+/* Test cse'ing of unsigned compares.  */
+/* { dg-do compile } */
+/* { dg-options "-O2 -fno-jump-tables" } */
+
+/* { dg-final { scan-assembler-not "cmpwi" } } */
+/* { dg-final { scan-assembler-times "cmplwi" 5 } } */
+
+extern int case0 (void);
+extern int case1 (void);
+extern int case2 (void);
+extern int case3 (void);
+extern int case4 (void);
+
+enum CASE_VALUES
+{
+  CASE0 = 0,
+  CASE1,
+  CASE2,
+  CASE3,
+  CASE4
+};
+
+int
+foo (enum CASE_VALUES index)
+{
+  switch (index)
+    {
+    case CASE0:
+      return case0 ();
+    case CASE1:
+      return case1 ();
+    case CASE2:
+      return case2 ();
+    case CASE3:
+      return case3 ();
+    case CASE4:
+      return case4 ();
+    }
+
+  return 0;
+}
Index: gcc/testsuite/gcc.target/powerpc/pr16458-4.c
===================================================================
--- gcc/testsuite/gcc.target/powerpc/pr16458-4.c	(revision 0)
+++ gcc/testsuite/gcc.target/powerpc/pr16458-4.c	(revision 0)
@@ -0,0 +1,44 @@ 
+/* Test cse'ing of unsigned compares.  */
+/* { dg-do compile } */
+/* { dg-options "-O2 -fno-jump-tables" } */
+
+/* The following tests fail due to an issue in expand not
+   attaching an type expression information on *index's reg rtx.  */
+
+/* { dg-final { scan-assembler-not "cmpwi" { xfail *-*-* } } } */
+/* { dg-final { scan-assembler-times "cmplwi" 5 { xfail *-*-* } } } */
+
+extern int case0 (void);
+extern int case1 (void);
+extern int case2 (void);
+extern int case3 (void);
+extern int case4 (void);
+
+enum CASE_VALUES
+{
+  CASE0 = 0,
+  CASE1,
+  CASE2,
+  CASE3,
+  CASE4
+};
+
+int
+foo (enum CASE_VALUES *index)
+{
+  switch (*index)
+    {
+    case CASE0:
+      return case0 ();
+    case CASE1:
+      return case1 ();
+    case CASE2:
+      return case2 ();
+    case CASE3:
+      return case3 ();
+    case CASE4:
+      return case4 ();
+    }
+
+  return 0;
+}