/* blob: 317cae6010c4318554c6ee1f38ecda50e30a715e [file] [log] [blame] */
/* { dg-do run { target aarch64_sve_hw } } */
/* { dg-options "-O" } */
/* { dg-options "-O -msve-vector-bits=256" { target aarch64_sve256_hw } } */
#include "vec_perm_1.c"
/* Call vec_perm_<TYPE> on VALUES1 and VALUES2 with the selector MASK
   (a vector of type MASK_TYPE) and abort unless the result compares
   byte-for-byte equal to EXPECTED_RESULT.

   The expansion is wrapped in do { ... } while (0) so that an invocation
   followed by a semicolon is exactly one statement; a bare { ... } block
   plus the caller's semicolon would be two statements and would break an
   unbraced if/else around the macro.  */
#define TEST_VEC_PERM(TYPE, MASK_TYPE, EXPECTED_RESULT, \
                      VALUES1, VALUES2, MASK) \
  do \
    { \
      TYPE expected_result = EXPECTED_RESULT; \
      TYPE values1 = VALUES1; \
      TYPE values2 = VALUES2; \
      MASK_TYPE mask = MASK; \
      TYPE dest; \
      dest = vec_perm_##TYPE (values1, values2, mask); \
      /* Compare the raw object representation of the whole vector.  */ \
      if (__builtin_memcmp (&dest, &expected_result, sizeof (TYPE)) != 0) \
        __builtin_abort (); \
    } \
  while (0)
/* Run TEST_VEC_PERM once for each of seven vector types and return 0 if
   none of the checks aborts.

   Every selector element is written as IDX + (K * M), where K is twice
   the number of elements in the vector literal (8, 16, 32 or 64) and M
   varies from entry to entry (0 up to 10).  Each expected vector listed
   here equals element IDX of VALUES1 followed by VALUES2, i.e. the
   selector reduced modulo K.

   NOTE(review): vec_perm_<TYPE> and the vnx* typedefs come from
   vec_perm_1.c, which is not visible here; presumably the helper wraps
   __builtin_shuffle and the literal lengths match the 256-bit vector
   length requested by the dg-options line for aarch64_sve256_hw --
   confirm against that file.  */
int main (void)
{
/* vnx2di: four elements per literal, selector offsets are multiples
   of 8.  */
TEST_VEC_PERM (vnx2di, vnx2di,
((vnx2di) { 5, 36, 7, 48 }),
((vnx2di) { 4, 5, 6, 7 }),
((vnx2di) { 12, 24, 36, 48 }),
((vnx2di) { 1 + (8 * 1), 6 + (8 * 3),
3 + (8 * 1), 7 + (8 * 5) }));
/* vnx4si: eight elements per literal, selector offsets are multiples
   of 16.  */
TEST_VEC_PERM (vnx4si, vnx4si,
((vnx4si) { 34, 38, 40, 10, 9, 8, 7, 35 }),
((vnx4si) { 3, 4, 5, 6, 7, 8, 9, 10 }),
((vnx4si) { 33, 34, 35, 36, 37, 38, 39, 40 }),
((vnx4si) { 9 + (16 * 2), 13 + (16 * 5),
15 + (16 * 1), 7 + (16 * 0),
6 + (16 * 8), 5 + (16 * 2),
4 + (16 * 3), 10 + (16 * 2) }));
/* vnx8hi: sixteen elements per literal, selector offsets are multiples
   of 32.  */
TEST_VEC_PERM (vnx8hi, vnx8hi,
((vnx8hi) { 12, 16, 18, 10, 42, 43, 44, 34,
7, 48, 3, 35, 9, 8, 7, 13 }),
((vnx8hi) { 3, 4, 5, 6, 7, 8, 9, 10,
11, 12, 13, 14, 15, 16, 17, 18 }),
((vnx8hi) { 33, 34, 35, 36, 37, 38, 39, 40,
41, 42, 43, 44, 45, 46, 47, 48 }),
((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
15 + (32 * 8), 7 + (32 * 9),
25 + (32 * 4), 26 + (32 * 3),
27 + (32 * 1), 17 + (32 * 2),
4 + (32 * 6), 31 + (32 * 7),
0 + (32 * 8), 18 + (32 * 9),
6 + (32 * 6), 5 + (32 * 7),
4 + (32 * 2), 10 + (32 * 2) }));
/* vnx16qi: thirty-two elements per literal, selector offsets are
   multiples of 64.  Both inputs repeat a four-value pattern.
   NOTE(review): offsets of 64 * 2 and 64 * 3 push selector entries past
   127; if vnx16qi elements are signed 8-bit (typedef not visible here)
   these entries rely on the initializer conversion wrapping --
   confirm.  */
TEST_VEC_PERM (vnx16qi, vnx16qi,
((vnx16qi) { 5, 6, 7, 4, 5, 6, 4, 5,
6, 7, 12, 24, 36, 48, 12, 24,
5, 6, 7, 4, 5, 6, 4, 5,
6, 7, 12, 24, 36, 48, 12, 24 }),
((vnx16qi) { 4, 5, 6, 7, 4, 5, 6, 7,
4, 5, 6, 7, 4, 5, 6, 7,
4, 5, 6, 7, 4, 5, 6, 7,
4, 5, 6, 7, 4, 5, 6, 7 }),
((vnx16qi) { 12, 24, 36, 48, 12, 24, 36, 48,
12, 24, 36, 48, 12, 24, 36, 48,
12, 24, 36, 48, 12, 24, 36, 48,
12, 24, 36, 48, 12, 24, 36, 48 }),
((vnx16qi) { 5 + (64 * 3), 6 + (64 * 1),
7 + (64 * 2), 8 + (64 * 1),
9 + (64 * 3), 10 + (64 * 1),
28 + (64 * 3), 29 + (64 * 3),
30 + (64 * 1), 31 + (64 * 1),
32 + (64 * 3), 33 + (64 * 2),
54 + (64 * 2), 55 + (64 * 2),
56 + (64 * 1), 61 + (64 * 2),
5 + (64 * 2), 6 + (64 * 1),
7 + (64 * 2), 8 + (64 * 2),
9 + (64 * 2), 10 + (64 * 1),
28 + (64 * 3), 29 + (64 * 1),
30 + (64 * 3), 31 + (64 * 3),
32 + (64 * 1), 33 + (64 * 1),
54 + (64 * 2), 55 + (64 * 2),
56 + (64 * 2), 61 + (64 * 2) }));
/* vnx2df data permuted by a vnx2di selector; same IDX pattern as the
   vnx2di case above, with different multipliers.  */
TEST_VEC_PERM (vnx2df, vnx2di,
((vnx2df) { 5.1, 36.1, 7.1, 48.1 }),
((vnx2df) { 4.1, 5.1, 6.1, 7.1 }),
((vnx2df) { 12.1, 24.1, 36.1, 48.1 }),
((vnx2di) { 1 + (8 * 3), 6 + (8 * 10),
3 + (8 * 8), 7 + (8 * 2) }));
/* vnx4sf data permuted by a vnx4si selector; same IDX pattern as the
   vnx4si case above, with different multipliers.  */
TEST_VEC_PERM (vnx4sf, vnx4si,
((vnx4sf) { 34.2, 38.2, 40.2, 10.2, 9.2, 8.2, 7.2, 35.2 }),
((vnx4sf) { 3.2, 4.2, 5.2, 6.2, 7.2, 8.2, 9.2, 10.2 }),
((vnx4sf) { 33.2, 34.2, 35.2, 36.2,
37.2, 38.2, 39.2, 40.2 }),
((vnx4si) { 9 + (16 * 1), 13 + (16 * 5),
15 + (16 * 4), 7 + (16 * 4),
6 + (16 * 3), 5 + (16 * 2),
4 + (16 * 1), 10 + (16 * 0) }));
/* vnx8hf data permuted by a vnx8hi selector; the selector is identical
   to the one used in the vnx8hi case above.  */
TEST_VEC_PERM (vnx8hf, vnx8hi,
((vnx8hf) { 12.0, 16.0, 18.0, 10.0, 42.0, 43.0, 44.0, 34.0,
7.0, 48.0, 3.0, 35.0, 9.0, 8.0, 7.0, 13.0 }),
((vnx8hf) { 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0,
11.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0 }),
((vnx8hf) { 33.0, 34.0, 35.0, 36.0, 37.0, 38.0, 39.0, 40.0,
41.0, 42.0, 43.0, 44.0, 45.0, 46.0, 47.0, 48.0 }),
((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
15 + (32 * 8), 7 + (32 * 9),
25 + (32 * 4), 26 + (32 * 3),
27 + (32 * 1), 17 + (32 * 2),
4 + (32 * 6), 31 + (32 * 7),
0 + (32 * 8), 18 + (32 * 9),
6 + (32 * 6), 5 + (32 * 7),
4 + (32 * 2), 10 + (32 * 2) }));
/* Reached only if no TEST_VEC_PERM check aborted.  */
return 0;
}