[gcc r12-7143] rs6000: Correct function prototypes for vec_replace_unaligned

Wed Feb 9 17:10:53 GMT 2022

https://gcc.gnu.org/g:ed3fea09b18f67e757b5768b42cb6e816626f1db

commit r12-7143-ged3fea09b18f67e757b5768b42cb6e816626f1db
Author: Bill Schmidt <wschmidt@linux.ibm.com>
Date:   Fri Feb 4 13:07:17 2022 -0600

    rs6000: Correct function prototypes for vec_replace_unaligned
    
    Due to a pasto error in the documentation, vec_replace_unaligned was
    implemented with the same function prototypes as vec_replace_elt.  It was
    intended that vec_replace_unaligned always specify output vectors as having
    type vector unsigned char, to emphasize that elements are potentially
    misaligned by this built-in function.  This patch corrects the
    misimplementation.
    
    2022-02-04  Bill Schmidt  <wschmidt@linux.ibm.com>
    
    gcc/
            * config/rs6000/rs6000-builtins.def (VREPLACE_UN_UV2DI): Change
            function prototype.
            (VREPLACE_UN_UV4SI): Likewise.
            (VREPLACE_UN_V2DF): Likewise.
            (VREPLACE_UN_V2DI): Likewise.
            (VREPLACE_UN_V4SF): Likewise.
            (VREPLACE_UN_V4SI): Likewise.
            * config/rs6000/rs6000-overload.def (VEC_REPLACE_UN): Change all
            function prototypes.
            * config/rs6000/vsx.md (vreplace_un_<mode>): Remove define_expand.
            (vreplace_un_<mode>): New define_insn.
    
    gcc/testsuite/
            * gcc.target/powerpc/vec-replace-word-runnable.c: Handle expected
            prototypes for each call to vec_replace_unaligned.

Diff:
---
 gcc/config/rs6000/rs6000-builtins.def              | 16 +++++++-------
 gcc/config/rs6000/rs6000-overload.def              | 12 +++++------
 gcc/config/rs6000/vsx.md                           | 25 +++++++++-------------
 .../gcc.target/powerpc/vec-replace-word-runnable.c | 20 +++++++++++------
 4 files changed, 38 insertions(+), 35 deletions(-)

diff --git a/gcc/config/rs6000/rs6000-builtins.def b/gcc/config/rs6000/rs6000-builtins.def
index 2d1e63fb20e..ae2760c3338 100644
--- a/gcc/config/rs6000/rs6000-builtins.def
+++ b/gcc/config/rs6000/rs6000-builtins.def
@@ -3387,25 +3387,25 @@
   const vull __builtin_altivec_vpextd (vull, vull);
     VPEXTD vpextd {}
 
-  const vull __builtin_altivec_vreplace_un_uv2di (vull, unsigned long long, \
-                                                  const int<4>);
+  const vuc __builtin_altivec_vreplace_un_uv2di (vull, unsigned long long, \
+                                                 const int<4>);
     VREPLACE_UN_UV2DI vreplace_un_v2di {}
 
-  const vui __builtin_altivec_vreplace_un_uv4si (vui, unsigned int, \
+  const vuc __builtin_altivec_vreplace_un_uv4si (vui, unsigned int, \
                                                  const int<4>);
     VREPLACE_UN_UV4SI vreplace_un_v4si {}
 
-  const vd __builtin_altivec_vreplace_un_v2df (vd, double, const int<4>);
+  const vuc __builtin_altivec_vreplace_un_v2df (vd, double, const int<4>);
     VREPLACE_UN_V2DF vreplace_un_v2df {}
 
-  const vsll __builtin_altivec_vreplace_un_v2di (vsll, signed long long, \
-                                                 const int<4>);
+  const vuc __builtin_altivec_vreplace_un_v2di (vsll, signed long long, \
+                                                const int<4>);
     VREPLACE_UN_V2DI vreplace_un_v2di {}
 
-  const vf __builtin_altivec_vreplace_un_v4sf (vf, float, const int<4>);
+  const vuc __builtin_altivec_vreplace_un_v4sf (vf, float, const int<4>);
     VREPLACE_UN_V4SF vreplace_un_v4sf {}
 
-  const vsi __builtin_altivec_vreplace_un_v4si (vsi, signed int, const int<4>);
+  const vuc __builtin_altivec_vreplace_un_v4si (vsi, signed int, const int<4>);
     VREPLACE_UN_V4SI vreplace_un_v4si {}
 
   const vull __builtin_altivec_vreplace_uv2di (vull, unsigned long long, \
diff --git a/gcc/config/rs6000/rs6000-overload.def b/gcc/config/rs6000/rs6000-overload.def
index 49a6104ddd2..44e2945aaa0 100644
--- a/gcc/config/rs6000/rs6000-overload.def
+++ b/gcc/config/rs6000/rs6000-overload.def
@@ -3059,17 +3059,17 @@
     VREPLACE_ELT_V2DF
 
 [VEC_REPLACE_UN, vec_replace_unaligned, __builtin_vec_replace_un]
-  vui __builtin_vec_replace_un (vui, unsigned int, const int);
+  vuc __builtin_vec_replace_un (vui, unsigned int, const int);
     VREPLACE_UN_UV4SI
-  vsi __builtin_vec_replace_un (vsi, signed int, const int);
+  vuc __builtin_vec_replace_un (vsi, signed int, const int);
     VREPLACE_UN_V4SI
-  vull __builtin_vec_replace_un (vull, unsigned long long, const int);
+  vuc __builtin_vec_replace_un (vull, unsigned long long, const int);
     VREPLACE_UN_UV2DI
-  vsll __builtin_vec_replace_un (vsll, signed long long, const int);
+  vuc __builtin_vec_replace_un (vsll, signed long long, const int);
     VREPLACE_UN_V2DI
-  vf __builtin_vec_replace_un (vf, float, const int);
+  vuc __builtin_vec_replace_un (vf, float, const int);
     VREPLACE_UN_V4SF
-  vd __builtin_vec_replace_un (vd, double, const int);
+  vuc __builtin_vec_replace_un (vd, double, const int);
     VREPLACE_UN_V2DF
 
 [VEC_REVB, vec_revb, __builtin_vec_revb]
diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md
index 2f5a2f7828d..b53de103872 100644
--- a/gcc/config/rs6000/vsx.md
+++ b/gcc/config/rs6000/vsx.md
@@ -4197,21 +4197,6 @@
  }
 [(set_attr "type" "vecsimple")])
 
-(define_expand "vreplace_un_<mode>"
- [(set (match_operand:REPLACE_ELT 0 "register_operand")
- (unspec:REPLACE_ELT [(match_operand:REPLACE_ELT 1 "register_operand")
-		      (match_operand:<VS_scalar> 2 "register_operand")
-		      (match_operand:QI 3 "const_0_to_12_operand")]
-		     UNSPEC_REPLACE_UN))]
- "TARGET_POWER10"
-{
-   /* Immediate value is the byte index Big Endian numbering.  */
-   emit_insn (gen_vreplace_elt_<mode>_inst (operands[0], operands[1],
-					    operands[2], operands[3]));
-   DONE;
- }
-[(set_attr "type" "vecsimple")])
-
 (define_insn "vreplace_elt_<mode>_inst"
  [(set (match_operand:REPLACE_ELT 0 "register_operand" "=v")
   (unspec:REPLACE_ELT [(match_operand:REPLACE_ELT 1 "register_operand" "0")
@@ -4222,6 +4207,16 @@
  "vins<REPLACE_ELT_char> %0,%2,%3"
  [(set_attr "type" "vecsimple")])
 
+(define_insn "vreplace_un_<mode>"
+ [(set (match_operand:V16QI 0 "register_operand" "=v")
+  (unspec:V16QI [(match_operand:REPLACE_ELT 1 "register_operand" "0")
+                 (match_operand:<VS_scalar> 2 "register_operand" "r")
+		 (match_operand:QI 3 "const_0_to_12_operand" "n")]
+		UNSPEC_REPLACE_UN))]
+ "TARGET_POWER10"
+ "vins<REPLACE_ELT_char> %0,%2,%3"
+ [(set_attr "type" "vecsimple")])
+
 ;; VSX_EXTRACT optimizations
 ;; Optimize double d = (double) vec_extract (vi, <n>)
 ;; Get the element into the top position and use XVCVSWDP/XVCVUWDP
diff --git a/gcc/testsuite/gcc.target/powerpc/vec-replace-word-runnable.c b/gcc/testsuite/gcc.target/powerpc/vec-replace-word-runnable.c
index 9497cbf2ab0..27318822871 100644
--- a/gcc/testsuite/gcc.target/powerpc/vec-replace-word-runnable.c
+++ b/gcc/testsuite/gcc.target/powerpc/vec-replace-word-runnable.c
@@ -54,6 +54,8 @@ main (int argc, char *argv [])
   vector double src_va_double;
   double src_a_double;
 
+  vector unsigned char vresult_uchar;
+
   /* Vector replace 32-bit element */
   src_a_uint = 345;
   src_va_uint = (vector unsigned int) { 0, 1, 2, 3 };
@@ -172,7 +174,8 @@ main (int argc, char *argv [])
   /* Byte index 7 will overwrite part of elements 2 and 3 */
   expected_vresult_uint = (vector unsigned int) { 1, 2, 345*256, 0 };
 						 
-  vresult_uint = vec_replace_unaligned (src_va_uint, src_a_uint, 3);
+  vresult_uchar = vec_replace_unaligned (src_va_uint, src_a_uint, 3);
+  vresult_uint = (vector unsigned int) vresult_uchar;
 
   if (!vec_all_eq (vresult_uint,  expected_vresult_uint)) {
 #if DEBUG
@@ -191,7 +194,8 @@ main (int argc, char *argv [])
   /* Byte index 7 will over write part of elements 1 and 2 */
   expected_vresult_int = (vector int) { 1, 234*256, 0, 4 };
 						 
-  vresult_int = vec_replace_unaligned (src_va_int, src_a_int, 7);
+  vresult_uchar = vec_replace_unaligned (src_va_int, src_a_int, 7);
+  vresult_int = (vector signed int) vresult_uchar;
 
   if (!vec_all_eq (vresult_int,  expected_vresult_int)) {
 #if DEBUG
@@ -209,7 +213,8 @@ main (int argc, char *argv [])
   vresult_float = (vector float) { 0.0, 0.0, 0.0, 0.0 };
   expected_vresult_float = (vector float) { 0.0, 34.0, 20.0, 30.0 };
 						 
-  vresult_float = vec_replace_unaligned (src_va_float, src_a_float, 8);
+  vresult_uchar = vec_replace_unaligned (src_va_float, src_a_float, 8);
+  vresult_float = (vector float) vresult_uchar;
 
   if (!vec_all_eq (vresult_float,  expected_vresult_float)) {
 #if DEBUG
@@ -231,7 +236,8 @@ main (int argc, char *argv [])
 							      0x200 };
 						 
   /* Byte index 7 will over write least significant byte of  element 0  */
-  vresult_ullint = vec_replace_unaligned (src_va_ullint, src_a_ullint, 7);
+  vresult_uchar = vec_replace_unaligned (src_va_ullint, src_a_ullint, 7);
+  vresult_ullint = (vector unsigned long long) vresult_uchar;
 
   if (!vec_all_eq (vresult_ullint,  expected_vresult_ullint)) {
 #if DEBUG
@@ -251,7 +257,8 @@ main (int argc, char *argv [])
   /* Byte index 7 will over write least significant byte of  element 0  */
   expected_vresult_llint = (vector long long int) { 678*256, 0x100 };
 						 
-  vresult_llint = vec_replace_unaligned (src_va_llint, src_a_llint, 7);
+  vresult_uchar = vec_replace_unaligned (src_va_llint, src_a_llint, 7);
+  vresult_llint = (vector signed long long) vresult_uchar;
 
   if (!vec_all_eq (vresult_llint,  expected_vresult_llint)) {
 #if DEBUG
@@ -270,7 +277,8 @@ main (int argc, char *argv [])
   vresult_double = (vector double) { 0.0, 0.0 };
   expected_vresult_double = (vector double) { 0.0, 678.0 };
 						 
-  vresult_double = vec_replace_unaligned (src_va_double, src_a_double, 0);
+  vresult_uchar = vec_replace_unaligned (src_va_double, src_a_double, 0);
+  vresult_double = (vector double) vresult_uchar;
 
   if (!vec_all_eq (vresult_double,  expected_vresult_double)) {
 #if DEBUG