Vector shuffling

Artem Shinkarov artyom.shinkaroff@gmail.com
Mon Oct 3 23:05:00 GMT 2011


On Mon, Oct 3, 2011 at 6:12 PM, Richard Henderson <rth@redhat.com> wrote:
> On 10/03/2011 09:43 AM, Artem Shinkarov wrote:
>> Hi, Richard
>>
>> There is a problem with the testcases of the patch you have committed
>> for me. The code in every test-case is doubled. Could you please,
>> apply the following patch, otherwise it would fail all the tests from
>> the vector-shuffle-patch would fail.
>
> Huh.  Dunno what happened there.  Fixed.
>
>> Also, if it is possible, could you change my name from in the
>> ChangeLog from "Artem Shinkarov" to "Artjoms Sinkarovs". The last
>> version is the way I am spelled in the passport, and the name I use in
>> the ChangeLog.
>
> Fixed.
>
>
> r~
>

Richard, there was a problem causing segfault in ix86_expand_vshuffle
which I have fixed with the patch attached.

Another thing I cannot figure out is the following case:
#define vector(elcount, type)  \
__attribute__((vector_size((elcount)*sizeof(type)))) type

vector (8, short) __attribute__ ((noinline))
f (vector (8, short) x, vector (8, short) y, vector (8, short) mask) {
    return  __builtin_shuffle (x, y, mask);
}

int main (int argc, char *argv[]) {
    vector (8, short) v0 = {argc, 1,2,3,4,5,6,7};
    vector (8, short) v1 = {argc, 1,argc,3,4,5,argc,7};
    vector (8, short) mask0 = {0,2,3,1,4,5,6,7};
    vector (8, short) v2;
    int i;

    v2 = f (v0, v1,  mask0);
    /* v2 =  __builtin_shuffle (v0, v1, mask0); */
    for (i = 0; i < 8; i ++)
      __builtin_printf ("%i, ", v2[i]);

    return 0;
}

I am compiling with support of ssse3, in my case it is ./xgcc -B. b.c
-O3 -mtune=core2 -march=core2

And I get 1, 1, 1, 3, 4, 5, 1, 7, on the output, which is wrong.

But if I will call __builtin_shuffle directly, then the answer is correct.

Any ideas?


Thanks,
Artem.
-------------- next part --------------
Index: gcc/config/i386/i386.c
===================================================================
--- gcc/config/i386/i386.c	(revision 179464)
+++ gcc/config/i386/i386.c	(working copy)
@@ -19312,14 +19312,17 @@ ix86_expand_vshuffle (rtx operands[])
       xops[1] = operands[1];
       xops[2] = operands[2];
       xops[3] = gen_rtx_EQ (mode, mask, w_vector);
-      xops[4] = t1;
-      xops[5] = t2;
+      xops[4] = t2;
+      xops[5] = t1;
 
       return ix86_expand_int_vcond (xops);
     }
 
-  /* mask = mask * {w, w, ...}  */
-  new_mask = expand_simple_binop (maskmode, MULT, new_mask, w_vector,
+  /* mask = mask * {16/w, 16/w, ...}  */
+  for (i = 0; i < w; i++)
+    vec[i] = GEN_INT (16/w);
+  vt = gen_rtx_CONST_VECTOR (maskmode, gen_rtvec_v (w, vec));
+  new_mask = expand_simple_binop (maskmode, MULT, new_mask, vt,
 				  NULL_RTX, 0, OPTAB_DIRECT);
 
   /* Convert mask to vector of chars.  */
@@ -19332,7 +19335,7 @@ ix86_expand_vshuffle (rtx operands[])
      ...  */
   for (i = 0; i < w; i++)
     for (j = 0; j < 16/w; j++)
-      vec[i*w+j] = GEN_INT (i*16/w);
+      vec[i*(16/w)+j] = GEN_INT (i*16/w);
   vt = gen_rtx_CONST_VECTOR (V16QImode, gen_rtvec_v (16, vec));
   vt = force_reg (V16QImode, vt);
 
@@ -19344,7 +19347,7 @@ ix86_expand_vshuffle (rtx operands[])
      new_mask = new_mask + {0,1,..,16/w, 0,1,..,16/w, ...}  */
   for (i = 0; i < w; i++)
     for (j = 0; j < 16/w; j++)
-      vec[i*w+j] = GEN_INT (j);
+      vec[i*(16/w)+j] = GEN_INT (j);
 
   vt = gen_rtx_CONST_VECTOR (V16QImode, gen_rtvec_v (16, vec));
   new_mask = expand_simple_binop (V16QImode, PLUS, new_mask, vt,
@@ -19386,8 +19389,8 @@ ix86_expand_vshuffle (rtx operands[])
       xops[1] = operands[1];
       xops[2] = operands[2];
       xops[3] = gen_rtx_EQ (mode, mask, w_vector);
-      xops[4] = t1;
-      xops[5] = t2;
+      xops[4] = t2;
+      xops[5] = t1;
 
       return ix86_expand_int_vcond (xops);
     }


More information about the Gcc-patches mailing list