[PATCH 1/5] RS6000 Add 128-bit Binary Integer sign extend operations

will schmidt will_schmidt@vnet.ibm.com
Thu Sep 24 18:20:55 GMT 2020


On Mon, 2020-09-21 at 16:56 -0700, Carl Love wrote:
> Segher, Will:
> 
> Patch 1, adds the 128-bit sign extension instruction support and
> corresponding builtin support.
> 
> No changes from the previous version.
> 
> The patch has been tested on 
> 
>   powerpc64le-unknown-linux-gnu (Power 9 LE)
> 
> with no regression errors.
> 
> Fixed the issues in the ChangeLog noted by Will.
> 
>              Carl Love
> 
> ---------------------------------------------------
> 
> gcc/ChangeLog
> 
> 2020-09-21  Carl Love  <cel@us.ibm.com>
> 	* config/rs6000/altivec.h (vec_signextll, vec_signexti): Add define
> 	for new builtins.
> 	* config/rs6000/rs6000-builtin.def (VSIGNEXTI, VSIGNEXTLL):  Add
> 	overloaded builtin definitions.
> 	(VSIGNEXTSB2W, VSIGNEXTSB2D, VSIGNEXTSH2D,VSIGNEXTSW2D): Add builtin
> 	expansions.

+VSIGNEXTSH2W  (missing from the list of builtin expansions above)


> 	* config/rs6000/rs6000-call.c (P9V_BUILTIN_VEC_VSIGNEXTI,
> 	P9V_BUILTIN_VEC_VSIGNEXTLL): Add overloaded argument definitions.
> 	* config/rs6000/vsx.md: Make define_insn vsx_sign_extend_si_v2di
> 	visible.
> 	* doc/extend.texi:  Add documentation for the vec_signexti and
> 	vec_signextll builtins.
> 
> gcc/testsuite/ChangeLog
> 
> 2020-09-21  Carl Love  <cel@us.ibm.com>
> 	* gcc.target/powerpc/p9-sign_extend-runnable.c:  New test case.
> ---
>  gcc/config/rs6000/altivec.h                   |   3 +
>  gcc/config/rs6000/rs6000-builtin.def          |   9 ++
>  gcc/config/rs6000/rs6000-call.c               |  13 ++
>  gcc/config/rs6000/vsx.md                      |   2 +-
>  gcc/doc/extend.texi                           |  15 ++
>  .../powerpc/p9-sign_extend-runnable.c         | 128 ++++++++++++++++++
>  6 files changed, 169 insertions(+), 1 deletion(-)
>  create mode 100644 gcc/testsuite/gcc.target/powerpc/p9-sign_extend-runnable.c
> 
> diff --git a/gcc/config/rs6000/altivec.h b/gcc/config/rs6000/altivec.h
> index 8a2dcda0144..acc365612be 100644
> --- a/gcc/config/rs6000/altivec.h
> +++ b/gcc/config/rs6000/altivec.h
> @@ -494,6 +494,9 @@
> 
>  #define vec_xlx __builtin_vec_vextulx
>  #define vec_xrx __builtin_vec_vexturx
> +#define vec_signexti  __builtin_vec_vsignexti
> +#define vec_signextll __builtin_vec_vsignextll
> +
>  #endif
> 
>  /* Predicates.
> diff --git a/gcc/config/rs6000/rs6000-builtin.def b/gcc/config/rs6000/rs6000-builtin.def
> index e91a48ddf5f..4c2e9460949 100644
> --- a/gcc/config/rs6000/rs6000-builtin.def
> +++ b/gcc/config/rs6000/rs6000-builtin.def
> @@ -2715,6 +2715,8 @@ BU_P9V_OVERLOAD_1 (VPRTYBD,	"vprtybd")
>  BU_P9V_OVERLOAD_1 (VPRTYBQ,	"vprtybq")
>  BU_P9V_OVERLOAD_1 (VPRTYBW,	"vprtybw")
>  BU_P9V_OVERLOAD_1 (VPARITY_LSBB,	"vparity_lsbb")
> +BU_P9V_OVERLOAD_1 (VSIGNEXTI,	"vsignexti")
> +BU_P9V_OVERLOAD_1 (VSIGNEXTLL,	"vsignextll")
> 
>  /* 2 argument functions added in ISA 3.0 (power9).  */
>  BU_P9_2 (CMPRB,	"byte_in_range",	CONST,	cmprb)
> @@ -2726,6 +2728,13 @@ BU_P9_OVERLOAD_2 (CMPRB,	"byte_in_range")
>  BU_P9_OVERLOAD_2 (CMPRB2,	"byte_in_either_range")
>  BU_P9_OVERLOAD_2 (CMPEQB,	"byte_in_set")
>  
> +/* Sign extend builtins that work on ISA 3.0, but not defined until ISA 3.1.  */
> +BU_P9V_AV_1 (VSIGNEXTSB2W,	"vsignextsb2w",		CONST,  vsx_sign_extend_qi_v4si)
> +BU_P9V_AV_1 (VSIGNEXTSH2W,	"vsignextsh2w",		CONST,  vsx_sign_extend_hi_v4si)
> +BU_P9V_AV_1 (VSIGNEXTSB2D,	"vsignextsb2d",		CONST,  vsx_sign_extend_qi_v2di)
> +BU_P9V_AV_1 (VSIGNEXTSH2D,	"vsignextsh2d",		CONST,  vsx_sign_extend_hi_v2di)
> +BU_P9V_AV_1 (VSIGNEXTSW2D,	"vsignextsw2d",		CONST,  vsx_sign_extend_si_v2di)
> +
>  /* Builtins for scalar instructions added in ISA 3.1 (power10).  */
>  BU_P10_MISC_2 (CFUGED, "cfuged", CONST, cfuged)
>  BU_P10_MISC_2 (CNTLZDM, "cntlzdm", CONST, cntlzdm)
> diff --git a/gcc/config/rs6000/rs6000-call.c b/gcc/config/rs6000/rs6000-call.c
> index a8b520834c7..9e514a01012 100644
> --- a/gcc/config/rs6000/rs6000-call.c
> +++ b/gcc/config/rs6000/rs6000-call.c
> @@ -5527,6 +5527,19 @@ const struct altivec_builtin_types altivec_overloaded_builtins[] = {
>      RS6000_BTI_unsigned_V2DI, RS6000_BTI_unsigned_V2DI,
>      RS6000_BTI_INTSI, RS6000_BTI_INTSI },
> 
> +  /* Sign extend builtins that work on ISA 3.0, not added until ISA 3.1 */
> +  { P9V_BUILTIN_VEC_VSIGNEXTI, P9V_BUILTIN_VSIGNEXTSB2W,
> +    RS6000_BTI_V4SI, RS6000_BTI_V16QI, 0, 0 },
> +  { P9V_BUILTIN_VEC_VSIGNEXTI, P9V_BUILTIN_VSIGNEXTSH2W,
> +    RS6000_BTI_V4SI, RS6000_BTI_V8HI, 0, 0 },
> +
> +  { P9V_BUILTIN_VEC_VSIGNEXTLL, P9V_BUILTIN_VSIGNEXTSB2D,
> +    RS6000_BTI_V2DI, RS6000_BTI_V16QI, 0, 0 },
> +  { P9V_BUILTIN_VEC_VSIGNEXTLL, P9V_BUILTIN_VSIGNEXTSH2D,
> +    RS6000_BTI_V2DI, RS6000_BTI_V8HI, 0, 0 },
> +  { P9V_BUILTIN_VEC_VSIGNEXTLL, P9V_BUILTIN_VSIGNEXTSW2D,
> +    RS6000_BTI_V2DI, RS6000_BTI_V4SI, 0, 0 },
> +
>    /* Overloaded built-in functions for ISA3.1 (power10). */
>    { P10_BUILTIN_VEC_CLRL, P10V_BUILTIN_VCLRLB,
>      RS6000_BTI_V16QI, RS6000_BTI_V16QI, RS6000_BTI_UINTSI, 0 },
> diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md
> index 4ff52455fd3..31fcffe8f33 100644
> --- a/gcc/config/rs6000/vsx.md
> +++ b/gcc/config/rs6000/vsx.md
> @@ -4787,7 +4787,7 @@
>    "vextsh2<wd> %0,%1"
>    [(set_attr "type" "vecexts")])
> 
> -(define_insn "*vsx_sign_extend_si_v2di"
> +(define_insn "vsx_sign_extend_si_v2di"
>    [(set (match_operand:V2DI 0 "vsx_register_operand" "=v")
>  	(unspec:V2DI [(match_operand:V4SI 1 "vsx_register_operand" "v")]
>  		     UNSPEC_VSX_SIGN_EXTEND))]
> diff --git a/gcc/doc/extend.texi b/gcc/doc/extend.texi
> index 5571c4f2ff2..c1c2c9f9bf7 100644
> --- a/gcc/doc/extend.texi
> +++ b/gcc/doc/extend.texi
> @@ -20800,6 +20800,21 @@ void vec_xst (vector unsigned char, int, vector unsigned char *);
>  void vec_xst (vector unsigned char, int, unsigned char *);
>  @end smallexample
> 
> +The following sign extension builtins are provided.
> +
> +@smallexample
> +vector signed int vec_signexti (vector signed char a)
> +vector signed long long vec_signextll (vector signed char a)
> +vector signed int vec_signexti (vector signed short a)
> +vector signed long long vec_signextll (vector signed short a)
> +vector signed long long vec_signextll (vector signed int a)

I'd sort by return type rather than by parameter type, but I'd defer; I don't
see that the existing documentation is entirely consistent in its ordering.



Nothing else jumps out at me.

This one LGTM.
Thanks,
-Will




> +@end smallexample
> +
> +Each element of the result is produced by sign-extending the element of the
> +input vector that would fall in the least significant portion of the result
> +element. For example, a sign-extension of a vector signed char to a vector
> +signed long long will sign extend the rightmost byte of each doubleword.
> +
>  @node PowerPC AltiVec Built-in Functions Available on ISA 3.1
>  @subsubsection PowerPC AltiVec Built-in Functions Available on ISA 3.1
> 
> diff --git a/gcc/testsuite/gcc.target/powerpc/p9-sign_extend-runnable.c b/gcc/testsuite/gcc.target/powerpc/p9-sign_extend-runnable.c
> new file mode 100644
> index 00000000000..7bf979c6fd4
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/powerpc/p9-sign_extend-runnable.c
> @@ -0,0 +1,128 @@
> +/* { dg-do run { target { powerpc*-*-linux* && { lp64 && p9vector_hw } } } } */
> +/* { dg-require-effective-target powerpc_p9vector_ok } */
> +/* { dg-options "-O2 -mdejagnu-cpu=power9 -save-temps" } */
> +
> +/* These builtins were not defined until ISA 3.1 but only require ISA 3.0
> +   support.  */
> +
> +/* { dg-final { scan-assembler-times {\mvextsb2w\M} 1 } } */
> +/* { dg-final { scan-assembler-times {\mvextsb2d\M} 1 } } */
> +/* { dg-final { scan-assembler-times {\mvextsh2w\M} 1 } } */
> +/* { dg-final { scan-assembler-times {\mvextsh2d\M} 1 } } */
> +/* { dg-final { scan-assembler-times {\mvextsw2d\M} 1 } } */
> +
> +#include <altivec.h>
> +
> +#define DEBUG 0
> +
> +#if DEBUG
> +#include <stdio.h>
> +#include <stdlib.h>
> +#endif
> +
> +void abort (void);
> +
> +int main ()
> +{
> +  int i;
> +
> +  vector signed char vec_arg_qi, vec_result_qi;
> +  vector signed short int vec_arg_hi, vec_result_hi, vec_expected_hi;
> +  vector signed int vec_arg_wi, vec_result_wi, vec_expected_wi;
> +  vector signed long long vec_result_di, vec_expected_di;
> +
> +  /* test sign extend byte to word */
> +  vec_arg_qi = (vector signed char) {1, 2, 3, 4, 5, 6, 7, 8,
> +				     -1, -2, -3, -4, -5, -6, -7, -8};
> +  vec_expected_wi = (vector signed int) {1, 5, -1, -5};
> +
> +  vec_result_wi = vec_signexti (vec_arg_qi);
> +
> +  for (i = 0; i < 4; i++)
> +    if (vec_result_wi[i] != vec_expected_wi[i]) {
> +#if DEBUG
> +      printf("ERROR: vec_signexti(char, int):  ");
> +      printf("vec_result_wi[%d] != vec_expected_wi[%d]\n",
> +	     i, i);
> +      printf("vec_result_wi[%d] = %d\n", i, vec_result_wi[i]);
> +      printf("vec_expected_wi[%d] = %d\n", i, vec_expected_wi[i]);
> +#else
> +      abort();
> +#endif
> +    }
> +
> +  /* test sign extend byte to double */
> +  vec_arg_qi = (vector signed char){1, 2, 3, 4, 5, 6, 7, 8,
> +				    -1, -2, -3, -4, -5, -6, -7, -8};
> +  vec_expected_di = (vector signed long long int){1, -1};
> +
> +  vec_result_di = vec_signextll(vec_arg_qi);
> +
> +  for (i = 0; i < 2; i++)
> +    if (vec_result_di[i] != vec_expected_di[i]) {
> +#if DEBUG
> +      printf("ERROR: vec_signextll(byte, long long int):  ");
> +      printf("vec_result_di[%d] != vec_expected_di[%d]\n", i, i);
> +      printf("vec_result_di[%d] = %lld\n", i, vec_result_di[i]);
> +      printf("vec_expected_di[%d] = %lld\n", i, vec_expected_di[i]);
> +#else
> +      abort();
> +#endif
> +    }
> +
> +  /* test sign extend short to word */
> +  vec_arg_hi = (vector signed short int){1, 2, 3, 4, -1, -2, -3, -4};
> +  vec_expected_wi = (vector signed int){1, 3, -1, -3};
> +
> +  vec_result_wi = vec_signexti(vec_arg_hi);
> +
> +  for (i = 0; i < 4; i++)
> +    if (vec_result_wi[i] != vec_expected_wi[i]) {
> +#if DEBUG
> +      printf("ERROR: vec_signexti(short, int):  ");
> +      printf("vec_result_wi[%d] != vec_expected_wi[%d]\n", i, i);
> +      printf("vec_result_wi[%d] = %d\n", i, vec_result_wi[i]);
> +      printf("vec_expected_wi[%d] = %d\n", i, vec_expected_wi[i]);
> +#else
> +      abort();
> +#endif
> +    }
> +
> +  /* test sign extend short to double word */
> +  vec_arg_hi = (vector signed short int ){1, 3, 5, 7,  -1, -3, -5, -7};
> +  vec_expected_di = (vector signed long long int){1, -1};
> +
> +  vec_result_di = vec_signextll(vec_arg_hi);
> +
> +  for (i = 0; i < 2; i++)
> +    if (vec_result_di[i] != vec_expected_di[i]) {
> +#if DEBUG
> +      printf("ERROR: vec_signextll(short, double):  ");
> +      printf("vec_result_di[%d] != vec_expected_di[%d]\n", i, i);
> +      printf("vec_result_di[%d] = %lld\n", i, vec_result_di[i]);
> +      printf("vec_expected_di[%d] = %lld\n", i, vec_expected_di[i]);
> +#else
> +      abort();
> +#endif
> +    }
> +
> +  /* test sign extend word to double word */
> +  vec_arg_wi = (vector signed int ){1, 3, -1, -3};
> +  vec_expected_di = (vector signed long long int){1, -1};
> +
> +  vec_result_di = vec_signextll(vec_arg_wi);
> +
> +  for (i = 0; i < 2; i++)
> +    if (vec_result_di[i] != vec_expected_di[i]) {
> +#if DEBUG
> +      printf("ERROR: vec_signextll(word, double):  ");
> +      printf("vec_result_di[%d] != vec_expected_di[%d]\n", i, i);
> +      printf("vec_result_di[%d] = %lld\n", i, vec_result_di[i]);
> +      printf("vec_expected_di[%d] = %lld\n", i, vec_expected_di[i]);
> +#else
> +      abort();
> +#endif
> +    }
> +
> +  return 0;
> +}



More information about the Gcc-patches mailing list