blob: d310f70d3a571745b095140858f6cdff72526994 [file] [log] [blame]
/* { dg-do run } */
/* { dg-require-effective-target s390_vxe } */
/* { dg-options "-O3 -mzarch -march=z14 -mzvector --save-temps -Wno-attributes" } */
#include <string.h>
#include <vecintrin.h>
typedef vector signed char v16qi;
typedef vector unsigned char uv16qi;
typedef vector bool char bv16qi;
typedef vector signed short int v8hi;
typedef vector unsigned short int uv8hi;
typedef vector bool short int bv8hi;
typedef vector signed int v4si;
typedef vector unsigned int uv4si;
typedef vector bool int bv4si;
typedef vector signed long long v2di;
typedef vector unsigned long long uv2di;
typedef vector bool long long bv2di;
typedef vector float v4sf;
typedef vector double v2df;
#define NUM_CONSTS 8
const v16qi v16qi_vals[NUM_CONSTS] =
{ (v16qi){ 1 },
(v16qi){ 2 },
(v16qi){ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1 },
(v16qi){ 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2 },
(v16qi){ -1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1 },
(v16qi){ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0 },
(v16qi){ 1,2,3,4,5,6,7,8,9,10,11,12,13,14,15 },
(v16qi){ 15,14,13,12,11,10,9,8,7,6,5,4,3,2,1 }
};
const v8hi v8hi_vals[NUM_CONSTS] =
{ (v8hi){ 1 },
(v8hi){ 2 },
(v8hi){ 1,1,1,1,1,1,1,1 },
(v8hi){ 2,2,2,2,2,2,2,2 },
(v8hi){ -1,-1,-1,-1,-1,-1,-1,-1 },
(v8hi){ 0,0,0,0,0,0,0,0 },
(v8hi){ 1,2,3,4,5,6,7,8 },
(v8hi){ 8,7,6,5,4,3,2,1 }
};
const v4si v4si_vals[NUM_CONSTS] =
{ (v4si){ 1 },
(v4si){ 2 },
(v4si){ 1,1,1,1 },
(v4si){ 2,2,2,2 },
(v4si){ -1,-1,-1,-1 },
(v4si){ 0,0,0,0 },
(v4si){ 1,2,3,4 },
(v4si){ 4,3,2,1 }
};
const v2di v2di_vals[NUM_CONSTS] =
{ (v2di){ 1 },
(v2di){ 2 },
(v2di){ 1,1 },
(v2di){ 2,2 },
(v2di){ -1,-1 },
(v2di){ 0,0 },
(v2di){ 1,2 },
(v2di){ 2,1 }
};
const v4sf v4sf_vals[NUM_CONSTS] =
{ (v4sf){ 1.0f },
(v4sf){ 2.0f },
(v4sf){ 1.0f,1.0f,1.0f,1.0f },
(v4sf){ 2.0f,2.0f,2.0f,2.0f },
(v4sf){ -1.0f,-1.0f,-1.0f,-1.0f },
(v4sf){ 0.0f,0.0f,0.0f,0.0f },
(v4sf){ 1.1f,2.1f,3.1f,4.1f },
(v4sf){ 4.1f,3.1f,2.1f,1.1f }
};
const v2df v2df_vals[NUM_CONSTS] =
{ (v2df){ 1.0 },
(v2df){ 2.0 },
(v2df){ 1.0,1.0 },
(v2df){ 2.0,2.0 },
(v2df){ -1.0,-1.0 },
(v2df){ 0.0,0.0 },
(v2df){ 1.1,2.1 },
(v2df){ 2.1,1.1 }
};
/* Each bit of the result vector has the value of the corresponding
bit of A if the corresponding bit of C is 0, or the value of the
corresponding bit of B otherwise. */
void __attribute__((noinline, noclone, target ("arch=zEC12")))
emul (unsigned char *result, unsigned char *a,
unsigned char *b, unsigned char *c)
{
for (int i = 0; i < 16; i++)
result[i] = (a[i] & ~c[i]) | (b[i] & c[i]);
}
#define GENFUNC(NAME, T1, T2) \
T1 __attribute__((noinline, noclone)) \
NAME##_reg (T1 a, T1 b, T2 c) { return vec_sel (a, b, c); } \
void __attribute__((noinline, noclone)) \
NAME##_mem (T1 *a, T1 *b, T2 *c, T1 *out) { *out = vec_sel (*a, *b, *c); } \
T1 __attribute__((always_inline)) \
NAME##_const (T1 a, T1 b, T2 c) { return vec_sel (a, b, c); }
GENFUNC (vec_sel_b8_a, bv16qi, uv16qi)
GENFUNC (vec_sel_b8_b, bv16qi, bv16qi)
GENFUNC (vec_sel_s8_a, v16qi, uv16qi)
GENFUNC (vec_sel_s8_b, v16qi, bv16qi)
GENFUNC (vec_sel_u8_a, uv16qi, uv16qi)
GENFUNC (vec_sel_u8_b, uv16qi, bv16qi)
GENFUNC (vec_sel_b16_a, bv8hi, uv8hi)
GENFUNC (vec_sel_b16_b, bv8hi, bv8hi)
GENFUNC (vec_sel_s16_a, v8hi, uv8hi)
GENFUNC (vec_sel_s16_b, v8hi, bv8hi)
GENFUNC (vec_sel_u16_a, uv8hi, uv8hi)
GENFUNC (vec_sel_u16_b, uv8hi, bv8hi)
GENFUNC (vec_sel_b32_a, bv4si, uv4si)
GENFUNC (vec_sel_b32_b, bv4si, bv4si)
GENFUNC (vec_sel_s32_a, v4si, uv4si)
GENFUNC (vec_sel_s32_b, v4si, bv4si)
GENFUNC (vec_sel_u32_a, uv4si, uv4si)
GENFUNC (vec_sel_u32_b, uv4si, bv4si)
GENFUNC (vec_sel_b64_a, bv2di, uv2di)
GENFUNC (vec_sel_b64_b, bv2di, bv2di)
GENFUNC (vec_sel_s64_a, v2di, uv2di)
GENFUNC (vec_sel_s64_b, v2di, bv2di)
GENFUNC (vec_sel_u64_a, uv2di, uv2di)
GENFUNC (vec_sel_u64_b, uv2di, bv2di)
GENFUNC (vec_sel_flt_a, v4sf, uv4si)
GENFUNC (vec_sel_flt_b, v4sf, bv4si)
GENFUNC (vec_sel_dbl_a, v2df, uv2di)
GENFUNC (vec_sel_dbl_b, v2df, bv2di)
#define TESTFUNC(NAME, T1, T2, VAL_TYPE) \
for (int i = 0; i < NUM_CONSTS; i++) \
for (int j = 0; j < NUM_CONSTS; j++) \
for (int k = 0; k < NUM_CONSTS; k++) \
{ \
unsigned char result[16]; \
T1 in1 = (T1)VAL_TYPE##_vals[i]; \
T1 in2 = (T1)VAL_TYPE##_vals[j]; \
T2 in3 = (T2)VAL_TYPE##_vals[k]; \
emul (result, (char*)&in1, (char*)&in2, (char*)&in3); \
\
T1 reg = NAME##_reg (in1, in2, in3); \
if (memcmp ((char*)&reg, result, 16) != 0) \
__builtin_abort (); \
\
T1 mem; \
NAME##_mem (&in1, &in2, &in3, &mem); \
if (memcmp ((char*)&mem, result, 16) != 0) \
__builtin_abort (); \
\
T1 cons = NAME##_const (in1, in2, in3); \
if (memcmp ((char*)&cons, result, 16) != 0) \
__builtin_abort (); \
}
int
main ()
{
TESTFUNC (vec_sel_b8_a, bv16qi, uv16qi, v16qi);
TESTFUNC (vec_sel_b8_b, bv16qi, bv16qi, v16qi);
TESTFUNC (vec_sel_s8_a, v16qi, uv16qi, v16qi);
TESTFUNC (vec_sel_s8_b, v16qi, bv16qi, v16qi);
TESTFUNC (vec_sel_u8_a, uv16qi, uv16qi, v16qi);
TESTFUNC (vec_sel_u8_b, uv16qi, bv16qi, v16qi);
TESTFUNC (vec_sel_b16_a, bv8hi, uv8hi, v8hi);
TESTFUNC (vec_sel_b16_b, bv8hi, bv8hi, v8hi);
TESTFUNC (vec_sel_s16_a, v8hi, uv8hi, v8hi);
TESTFUNC (vec_sel_s16_b, v8hi, bv8hi, v8hi);
TESTFUNC (vec_sel_u16_a, uv8hi, uv8hi, v8hi);
TESTFUNC (vec_sel_u16_b, uv8hi, bv8hi, v8hi);
TESTFUNC (vec_sel_b32_a, bv4si, uv4si, v4si);
TESTFUNC (vec_sel_b32_b, bv4si, bv4si, v4si);
TESTFUNC (vec_sel_s32_a, v4si, uv4si, v4si);
TESTFUNC (vec_sel_s32_b, v4si, bv4si, v4si);
TESTFUNC (vec_sel_u32_a, uv4si, uv4si, v4si);
TESTFUNC (vec_sel_u32_b, uv4si, bv4si, v4si);
TESTFUNC (vec_sel_b64_a, bv2di, uv2di, v2di);
TESTFUNC (vec_sel_b64_b, bv2di, bv2di, v2di);
TESTFUNC (vec_sel_s64_a, v2di, uv2di, v2di);
TESTFUNC (vec_sel_s64_b, v2di, bv2di, v2di);
TESTFUNC (vec_sel_u64_a, uv2di, uv2di, v2di);
TESTFUNC (vec_sel_u64_b, uv2di, bv2di, v2di);
TESTFUNC (vec_sel_flt_a, v4sf, uv4si, v4sf);
TESTFUNC (vec_sel_flt_b, v4sf, bv4si, v4sf);
TESTFUNC (vec_sel_dbl_a, v2df, uv2di, v2df);
TESTFUNC (vec_sel_dbl_b, v2df, bv2di, v2df);
}
/* { dg-final { scan-assembler {\n\tvsel\t} } } */