This is the mail archive of the
gcc-patches@gcc.gnu.org
mailing list for the GCC project.
Re: [ARM Patch 3/3]PR53189: optimizations of 64bit logic operation with constant
- From: Carrot Wei <carrot at google dot com>
- To: gcc-patches at gcc dot gnu dot org
- Date: Fri, 6 Jul 2012 16:17:22 +0800
- Subject: Re: [ARM Patch 3/3]PR53189: optimizations of 64bit logic operation with constant
Hi
I updated this patch to use const_ok_for_dimode_op to decide if a
const is legal for iordi3 insn. The special cases of all 0 and all 1
constant are also handled.
Tested on arm qemu with all thumb/arm neon/non-neon combination, no regression.
thanks
Carrot
2012-07-06 Wei Guozhi <carrot@google.com>
PR target/53189
* gcc.target/arm/pr53189-7.c: New testcase.
* gcc.target/arm/pr53189-8.c: New testcase.
* gcc.target/arm/pr53189-9.c: New testcase.
2012-07-06 Wei Guozhi <carrot@google.com>
PR target/53189
* config/arm/arm.c (const_ok_for_dimode_op): Handle IOR op.
* config/arm/constraints.md (Df): New constraint.
* config/arm/predicates.md (arm_iordi_operand): New predicate.
(arm_immediate_iordi_operand): Likewise.
(iordi_operand): Likewise.
* config/arm/arm.md (iorsi3_insn): Optimization for special constants.
(iordi3): Extend it to handle 64bit constants.
(iordi3_insn): Likewise.
* config/arm/neon.md (iordi3_neon): Likewise.
Index: gcc/testsuite/gcc.target/arm/pr53189-7.c
===================================================================
--- gcc/testsuite/gcc.target/arm/pr53189-7.c (revision 0)
+++ gcc/testsuite/gcc.target/arm/pr53189-7.c (revision 0)
@@ -0,0 +1,8 @@
+/* { dg-options "-O2" } */
+/* { dg-require-effective-target arm32 } */
+/* { dg-final { scan-assembler-not "mov" } } */
+
+void t0p(long long * p)
+{
+ *p |= 0x100000008;
+}
Index: gcc/testsuite/gcc.target/arm/pr53189-8.c
===================================================================
--- gcc/testsuite/gcc.target/arm/pr53189-8.c (revision 0)
+++ gcc/testsuite/gcc.target/arm/pr53189-8.c (revision 0)
@@ -0,0 +1,9 @@
+/* { dg-options "-O2" } */
+/* { dg-require-effective-target arm32 } */
+/* { dg-final { scan-assembler-times "mvn" 1 } } */
+/* { dg-final { scan-assembler-times "orr" 1 } } */
+
+void t0p(long long * p)
+{
+ *p |= 0x1FFFFFFFF;
+}
Index: gcc/testsuite/gcc.target/arm/pr53189-9.c
===================================================================
--- gcc/testsuite/gcc.target/arm/pr53189-9.c (revision 0)
+++ gcc/testsuite/gcc.target/arm/pr53189-9.c (revision 0)
@@ -0,0 +1,9 @@
+/* { dg-options "-O2" } */
+/* { dg-require-effective-target arm32 } */
+/* { dg-final { scan-assembler-not "mov" } } */
+/* { dg-final { scan-assembler-times "orr" 1 } } */
+
+void t0p(long long * p)
+{
+ *p |= 0x100000000;
+}
Index: gcc/config/arm/arm.c
===================================================================
--- gcc/config/arm/arm.c (revision 189278)
+++ gcc/config/arm/arm.c (working copy)
@@ -2524,6 +2524,16 @@
case PLUS:
return arm_not_operand (hi, SImode) && arm_add_operand (lo, SImode);
+ case IOR:
+ if ((const_ok_for_arm (hi_val) || (hi_val == 0xFFFFFFFF))
+ && (const_ok_for_arm (lo_val) || (lo_val == 0xFFFFFFFF)))
+ return 1;
+ if (TARGET_THUMB2
+ && (const_ok_for_arm (lo_val) || const_ok_for_arm (~lo_val))
+ && (const_ok_for_arm (hi_val) || const_ok_for_arm (~hi_val)))
+ return 1;
+ return 0;
+
default:
return 0;
}
Index: gcc/config/arm/neon.md
===================================================================
--- gcc/config/arm/neon.md (revision 189278)
+++ gcc/config/arm/neon.md (working copy)
@@ -731,9 +731,9 @@
)
(define_insn "iordi3_neon"
- [(set (match_operand:DI 0 "s_register_operand" "=w,w,?&r,?&r,?w,?w")
- (ior:DI (match_operand:DI 1 "s_register_operand" "%w,0,0,r,w,0")
- (match_operand:DI 2 "neon_logic_op2" "w,Dl,r,r,w,Dl")))]
+ [(set (match_operand:DI 0 "s_register_operand" "=w,w,?&r,?&r,?w,?w,?&r,?&r")
+ (ior:DI (match_operand:DI 1 "s_register_operand" "%w,0,0,r,w,0,0,r")
+ (match_operand:DI 2 "iordi_operand" "w,Dl,r,r,w,Dl,Df,Df")))]
"TARGET_NEON"
{
switch (which_alternative)
@@ -745,12 +745,14 @@
DImode, 0, VALID_NEON_QREG_MODE (DImode));
case 2: return "#";
case 3: return "#";
+ case 6: return "#";
+ case 7: return "#";
default: gcc_unreachable ();
}
}
- [(set_attr "neon_type" "neon_int_1,neon_int_1,*,*,neon_int_1,neon_int_1")
- (set_attr "length" "*,*,8,8,*,*")
- (set_attr "arch" "nota8,nota8,*,*,onlya8,onlya8")]
+ [(set_attr "neon_type" "neon_int_1,neon_int_1,*,*,neon_int_1,neon_int_1,*,*")
+ (set_attr "length" "*,*,8,8,*,*,8,8")
+ (set_attr "arch" "nota8,nota8,*,*,onlya8,onlya8,*,*")]
)
;; The concrete forms of the Neon immediate-logic instructions are vbic and
Index: gcc/config/arm/constraints.md
===================================================================
--- gcc/config/arm/constraints.md (revision 189278)
+++ gcc/config/arm/constraints.md (working copy)
@@ -31,7 +31,7 @@
;; 'H' was previously used for FPA.
;; The following multi-letter normal constraints have been used:
-;; in ARM/Thumb-2 state: Da, Db, Dc, Dd, Dn, Dl, DL, Dv, Dy, Di, Dt, Dz
+;; in ARM/Thumb-2 state: Da, Db, Dc, Dd, Df, Dn, Dl, DL, Dv, Dy, Di, Dt, Dz
;; in Thumb-1 state: Pa, Pb, Pc, Pd, Pe
;; in Thumb-2 state: Pj, PJ, Ps, Pt, Pu, Pv, Pw, Px, Py
@@ -248,6 +248,12 @@
(and (match_code "const_int")
(match_test "TARGET_32BIT && const_ok_for_dimode_op (ival, PLUS)")))
+(define_constraint "Df"
+ "@internal
+ In ARM/Thumb-2 state a const_int that can be used by iordi3_insn."
+ (and (match_code "const_int")
+ (match_test "TARGET_32BIT && const_ok_for_dimode_op (ival, IOR)")))
+
(define_constraint "Di"
"@internal
In ARM/Thumb-2 state a const_int or const_double where both the high
Index: gcc/config/arm/predicates.md
===================================================================
--- gcc/config/arm/predicates.md (revision 189278)
+++ gcc/config/arm/predicates.md (working copy)
@@ -104,6 +104,14 @@
(and (match_code "const_int,const_double")
(match_test "arm_const_double_by_immediates (op)")))
+(define_predicate "arm_immediate_iordi_operand"
+ (and (match_code "const_int")
+ (match_test "const_ok_for_dimode_op (INTVAL (op), IOR)")))
+
+(define_predicate "arm_iordi_operand"
+ (ior (match_operand 0 "arm_immediate_iordi_operand")
+ (match_operand 0 "s_register_operand")))
+
(define_predicate "arm_neg_immediate_operand"
(and (match_code "const_int")
(match_test "const_ok_for_arm (-INTVAL (op))")))
@@ -520,6 +528,10 @@
(ior (match_operand 0 "imm_for_neon_logic_operand")
(match_operand 0 "s_register_operand")))
+(define_predicate "iordi_operand"
+ (ior (match_operand 0 "neon_logic_op2")
+ (match_operand 0 "arm_iordi_operand")))
+
(define_predicate "neon_inv_logic_op2"
(ior (match_operand 0 "imm_for_neon_inv_logic_operand")
(match_operand 0 "s_register_operand")))
Index: gcc/config/arm/arm.md
===================================================================
--- gcc/config/arm/arm.md (revision 189278)
+++ gcc/config/arm/arm.md (working copy)
@@ -2828,17 +2828,30 @@
(define_expand "iordi3"
[(set (match_operand:DI 0 "s_register_operand" "")
(ior:DI (match_operand:DI 1 "s_register_operand" "")
- (match_operand:DI 2 "neon_logic_op2" "")))]
+ (match_operand:DI 2 "iordi_operand" "")))]
"TARGET_32BIT"
""
)
-(define_insn "*iordi3_insn"
- [(set (match_operand:DI 0 "s_register_operand" "=&r,&r")
- (ior:DI (match_operand:DI 1 "s_register_operand" "%0,r")
- (match_operand:DI 2 "s_register_operand" "r,r")))]
+(define_insn_and_split "*iordi3_insn"
+ [(set (match_operand:DI 0 "s_register_operand" "=&r,&r,&r,&r")
+ (ior:DI (match_operand:DI 1 "s_register_operand" "%0,r, 0, r")
+ (match_operand:DI 2 "arm_iordi_operand" "r, r, Df,Df")))]
"TARGET_32BIT && !TARGET_IWMMXT && !TARGET_NEON"
"#"
+ "TARGET_32BIT && !TARGET_IWMMXT && reload_completed
+ && !(TARGET_NEON && IS_VFP_REGNUM (REGNO (operands[0])))"
+ [(set (match_dup 0) (ior:SI (match_dup 1) (match_dup 2)))
+ (set (match_dup 3) (ior:SI (match_dup 4) (match_dup 5)))]
+ "
+ {
+ operands[3] = gen_highpart (SImode, operands[0]);
+ operands[0] = gen_lowpart (SImode, operands[0]);
+ operands[4] = gen_highpart (SImode, operands[1]);
+ operands[1] = gen_lowpart (SImode, operands[1]);
+ operands[5] = gen_highpart_mode (SImode, DImode, operands[2]);
+ operands[2] = gen_lowpart (SImode, operands[2]);
+ }"
[(set_attr "length" "8")
(set_attr "predicable" "yes")]
)
@@ -2902,10 +2915,29 @@
(ior:SI (match_operand:SI 1 "s_register_operand" "%r,r,r")
(match_operand:SI 2 "reg_or_int_operand" "rI,K,?n")))]
"TARGET_32BIT"
- "@
- orr%?\\t%0, %1, %2
- orn%?\\t%0, %1, #%B2
- #"
+ "*
+ {
+ if (CONST_INT_P (operands[2]))
+ {
+ HOST_WIDE_INT i = INTVAL (operands[2]) & 0xFFFFFFFF;
+ if (i == 0xFFFFFFFF)
+ return \"mvn%?\\t%0, #0\";
+ if (i == 0)
+ {
+ if (!rtx_equal_p (operands[0], operands[1]))
+ return \"mov%?\\t%0, %1\";
+ else
+ return \"\";
+ }
+ }
+
+ switch (which_alternative)
+ {
+ case 0: return \"orr%?\\t%0, %1, %2\";
+ case 1: return \"orn%?\\t%0, %1, #%B2\";
+ case 2: return \"#\";
+ }
+ }"
"TARGET_32BIT
&& GET_CODE (operands[2]) == CONST_INT
&& !(const_ok_for_arm (INTVAL (operands[2]))
On Tue, Jun 5, 2012 at 5:14 PM, Carrot Wei <carrot@google.com> wrote:
> Hi
>
> This is the fourth part of the patches that deals with 64bit ior. It directly
> extends the patterns iordi3, iordi3_insn and iordi3_neon to handle 64bit
> constant operands.
>
> Tested on arm qemu without regression.
>
> OK for trunk?
>
> thanks
> Carrot
>
> 2012-06-05 Wei Guozhi <carrot@google.com>
>
> PR target/53447
> * gcc.target/arm/pr53447-4.c: New testcase.
>
>
> 2012-06-05 Wei Guozhi <carrot@google.com>
>
> PR target/53447
> * config/arm/arm-protos.h (const_ok_for_iordi): New prototype.
> * config/arm/arm.c (const_ok_for_iordi): New function.
> * config/arm/constraints.md (Df): New constraint.
> * config/arm/predicates.md (arm_iordi_operand): New predicate.
> (arm_immediate_iordi_operand): Likewise.
> (iordi_operand): Likewise.
> * config/arm/arm.md (iordi3): Extend it to handle 64bit constants.
> (iordi3_insn): Likewise.
> * config/arm/neon.md (iordi3_neon): Likewise.
>
>
> Index: testsuite/gcc.target/arm/pr53447-4.c
> ===================================================================
> --- testsuite/gcc.target/arm/pr53447-4.c (revision 0)
> +++ testsuite/gcc.target/arm/pr53447-4.c (revision 0)
> @@ -0,0 +1,8 @@
> +/* { dg-options "-O2" } */
> +/* { dg-require-effective-target arm32 } */
> +/* { dg-final { scan-assembler-not "mov" } } */
> +
> +void t0p(long long * p)
> +{
> + *p |= 0x100000008;
> +}
>
>
> Index: config/arm/arm.c
> ===================================================================
> --- config/arm/arm.c (revision 188048)
> +++ config/arm/arm.c (working copy)
> @@ -2496,6 +2496,24 @@
> }
> }
>
> +/* Return TRUE if int I is a valid immediate constant used by pattern
> + iordi3_insn. */
> +int
> +const_ok_for_iordi (HOST_WIDE_INT i)
> +{
> + HOST_WIDE_INT high = ARM_SIGN_EXTEND ((i >> 32) & 0xFFFFFFFF);
> + HOST_WIDE_INT low = ARM_SIGN_EXTEND (i & 0xFFFFFFFF);
> +
> + if (TARGET_32BIT && const_ok_for_arm (low) && const_ok_for_arm (high))
> + return 1;
> +
> + if (TARGET_THUMB2 && (const_ok_for_arm (low) || const_ok_for_arm (~low))
> + && (const_ok_for_arm (high) || const_ok_for_arm (~high)))
> + return 1;
> +
> + return 0;
> +}
> +
> /* Emit a sequence of insns to handle a large constant.
> CODE is the code of the operation required, it can be any of SET, PLUS,
> IOR, AND, XOR, MINUS;
> Index: config/arm/arm-protos.h
> ===================================================================
> --- config/arm/arm-protos.h (revision 188048)
> +++ config/arm/arm-protos.h (working copy)
> @@ -47,6 +47,7 @@
> extern bool arm_small_register_classes_for_mode_p (enum machine_mode);
> extern int arm_hard_regno_mode_ok (unsigned int, enum machine_mode);
> extern bool arm_modes_tieable_p (enum machine_mode, enum machine_mode);
> +extern int const_ok_for_iordi (HOST_WIDE_INT);
> extern int const_ok_for_arm (HOST_WIDE_INT);
> extern int const_ok_for_op (HOST_WIDE_INT, enum rtx_code);
> extern int arm_split_constant (RTX_CODE, enum machine_mode, rtx,
> Index: config/arm/neon.md
> ===================================================================
> --- config/arm/neon.md (revision 188048)
> +++ config/arm/neon.md (working copy)
> @@ -729,9 +729,9 @@
> )
>
> (define_insn "iordi3_neon"
> - [(set (match_operand:DI 0 "s_register_operand" "=w,w,?&r,?&r,?w,?w")
> - (ior:DI (match_operand:DI 1 "s_register_operand" "%w,0,0,r,w,0")
> - (match_operand:DI 2 "neon_logic_op2" "w,Dl,r,r,w,Dl")))]
> + [(set (match_operand:DI 0 "s_register_operand" "=w,w,?&r,?&r,?w,?w,?&r,?&r")
> + (ior:DI (match_operand:DI 1 "s_register_operand" "%w,0,0,r,w,0,0,r")
> + (match_operand:DI 2 "iordi_operand" "w,Dl,r,r,w,Dl,Df,Df")))]
> "TARGET_NEON"
> {
> switch (which_alternative)
> @@ -743,12 +743,14 @@
> DImode, 0, VALID_NEON_QREG_MODE (DImode));
> case 2: return "#";
> case 3: return "#";
> + case 6: return "#";
> + case 7: return "#";
> default: gcc_unreachable ();
> }
> }
> - [(set_attr "neon_type" "neon_int_1,neon_int_1,*,*,neon_int_1,neon_int_1")
> - (set_attr "length" "*,*,8,8,*,*")
> - (set_attr "arch" "nota8,nota8,*,*,onlya8,onlya8")]
> + [(set_attr "neon_type" "neon_int_1,neon_int_1,*,*,neon_int_1,neon_int_1,*,*")
> + (set_attr "length" "*,*,8,8,*,*,8,8")
> + (set_attr "arch" "nota8,nota8,*,*,onlya8,onlya8,*,*")]
> )
>
> ;; The concrete forms of the Neon immediate-logic instructions are vbic and
> Index: config/arm/constraints.md
> ===================================================================
> --- config/arm/constraints.md (revision 188048)
> +++ config/arm/constraints.md (working copy)
> @@ -29,7 +29,7 @@
> ;; in Thumb-1 state: I, J, K, L, M, N, O
>
> ;; The following multi-letter normal constraints have been used:
> -;; in ARM/Thumb-2 state: Da, Db, Dc, Dn, Dl, DL, Dv, Dy, Di, Dt, Dz
> +;; in ARM/Thumb-2 state: Da, Db, Dc, Df, Dn, Dl, DL, Dv, Dy, Di, Dt, Dz
> ;; in Thumb-1 state: Pa, Pb, Pc, Pd, Pe
> ;; in Thumb-2 state: Pj, PJ, Ps, Pt, Pu, Pv, Pw, Px, Py
>
> @@ -251,6 +251,12 @@
> (match_test "TARGET_32BIT && arm_const_double_inline_cost (op) == 4
> && !(optimize_size || arm_ld_sched)")))
>
> +(define_constraint "Df"
> + "@internal
> + In ARM/Thumb-2 state a const_int that can be used by iordi3_insn. "
> + (and (match_code "const_int")
> + (match_test "TARGET_32BIT && const_ok_for_iordi (ival)")))
> +
> (define_constraint "Di"
> "@internal
> In ARM/Thumb-2 state a const_int or const_double where both the high
> Index: config/arm/predicates.md
> ===================================================================
> --- config/arm/predicates.md (revision 188048)
> +++ config/arm/predicates.md (working copy)
> @@ -117,6 +117,14 @@
> (and (match_code "const_int,const_double")
> (match_test "arm_const_double_by_immediates (op)")))
>
> +(define_predicate "arm_immediate_iordi_operand"
> + (and (match_code "const_int")
> + (match_test "const_ok_for_iordi (INTVAL (op))")))
> +
> +(define_predicate "arm_iordi_operand"
> + (ior (match_operand 0 "arm_immediate_iordi_operand")
> + (match_operand 0 "s_register_operand")))
> +
> (define_predicate "arm_neg_immediate_operand"
> (and (match_code "const_int")
> (match_test "const_ok_for_arm (-INTVAL (op))")))
> @@ -547,6 +555,10 @@
> (ior (match_operand 0 "imm_for_neon_logic_operand")
> (match_operand 0 "s_register_operand")))
>
> +(define_predicate "iordi_operand"
> + (ior (match_operand 0 "neon_logic_op2")
> + (match_operand 0 "arm_iordi_operand")))
> +
> (define_predicate "neon_inv_logic_op2"
> (ior (match_operand 0 "imm_for_neon_inv_logic_operand")
> (match_operand 0 "s_register_operand")))
> Index: config/arm/arm.md
> ===================================================================
> --- config/arm/arm.md (revision 188048)
> +++ config/arm/arm.md (working copy)
> @@ -2854,17 +2854,38 @@
> (define_expand "iordi3"
> [(set (match_operand:DI 0 "s_register_operand" "")
> (ior:DI (match_operand:DI 1 "s_register_operand" "")
> - (match_operand:DI 2 "neon_logic_op2" "")))]
> + (match_operand:DI 2 "iordi_operand" "")))]
> "TARGET_32BIT"
> ""
> )
>
> -(define_insn "*iordi3_insn"
> - [(set (match_operand:DI 0 "s_register_operand" "=&r,&r")
> - (ior:DI (match_operand:DI 1 "s_register_operand" "%0,r")
> - (match_operand:DI 2 "s_register_operand" "r,r")))]
> +(define_insn_and_split "*iordi3_insn"
> + [(set (match_operand:DI 0 "s_register_operand" "=&r,&r,&r,&r")
> + (ior:DI (match_operand:DI 1 "s_register_operand" "%0,r,0,r")
> + (match_operand:DI 2 "arm_iordi_operand" "r,r,Df,Df")))]
> "TARGET_32BIT && !TARGET_IWMMXT && !TARGET_NEON"
> "#"
> + "TARGET_32BIT && !TARGET_IWMMXT && reload_completed"
> + [(set (match_dup 0) (ior:SI (match_dup 1) (match_dup 2)))
> + (set (match_dup 3) (ior:SI (match_dup 4) (match_dup 5)))]
> + "
> + {
> + operands[3] = gen_highpart (SImode, operands[0]);
> + operands[0] = gen_lowpart (SImode, operands[0]);
> + operands[4] = gen_highpart (SImode, operands[1]);
> + operands[1] = gen_lowpart (SImode, operands[1]);
> + if (GET_CODE (operands[2]) == CONST_INT)
> + {
> + HOST_WIDE_INT v = INTVAL (operands[2]);
> + operands[5] = GEN_INT (ARM_SIGN_EXTEND ((v >> 32) & 0xFFFFFFFF));
> + operands[2] = GEN_INT (ARM_SIGN_EXTEND (v & 0xFFFFFFFF));
> + }
> + else
> + {
> + operands[5] = gen_highpart (SImode, operands[2]);
> + operands[2] = gen_lowpart (SImode, operands[2]);
> + }
> + }"
> [(set_attr "length" "8")
> (set_attr "predicable" "yes")]
> )