/* Source blob: 687716e7176a3f2a2f82a6368d3df3d970dbf614 */
/* { dg-do assemble { target aarch64_asm_sve_ok } } */
/* { dg-options "-O2 -ftree-vectorize -ffast-math --save-temps --param aarch64-sve-compare-costs=0" } */
#include <stdint.h>
/* Define the function f_<DATA_TYPE>_<CMP_TYPE>_<INDEX_TYPE>.
   For each i in [0, n) the function compares cmp1[i] with cmp2[i] and,
   only when they are equal, adds src[indices[i]] to dest[i].  The read
   of src is therefore both conditional and indirectly indexed.
   dest and src are restrict-qualified; cmp1, cmp2 and indices are not.
   The dg-final directives in this file count instructions generated
   from this loop, so its exact form should not be changed casually. */
#define TEST_LOOP(DATA_TYPE, CMP_TYPE, INDEX_TYPE) \
void \
f_##DATA_TYPE##_##CMP_TYPE##_##INDEX_TYPE \
(DATA_TYPE *restrict dest, DATA_TYPE *restrict src, \
CMP_TYPE *cmp1, CMP_TYPE *cmp2, INDEX_TYPE *indices, int n) \
{ \
for (int i = 0; i < n; ++i) \
if (cmp1[i] == cmp2[i]) \
dest[i] += src[indices[i]]; \
}
/* Invoke T (DATA_TYPE, CMP_TYPE, INDEX_TYPE) six times for the given
   DATA_TYPE: once for each comparison type in { int16_t, uint16_t,
   _Float16 } paired with each index type in { int32_t, uint32_t }. */
#define TEST32(T, DATA_TYPE) \
T (DATA_TYPE, int16_t, int32_t) \
T (DATA_TYPE, uint16_t, int32_t) \
T (DATA_TYPE, _Float16, int32_t) \
T (DATA_TYPE, int16_t, uint32_t) \
T (DATA_TYPE, uint16_t, uint32_t) \
T (DATA_TYPE, _Float16, uint32_t)
/* Invoke T (DATA_TYPE, CMP_TYPE, INDEX_TYPE) six times for the given
   DATA_TYPE: once for each comparison type in { int32_t, uint32_t,
   float } paired with each index type in { int64_t, uint64_t }. */
#define TEST64(T, DATA_TYPE) \
T (DATA_TYPE, int32_t, int64_t) \
T (DATA_TYPE, uint32_t, int64_t) \
T (DATA_TYPE, float, int64_t) \
T (DATA_TYPE, int32_t, uint64_t) \
T (DATA_TYPE, uint32_t, uint64_t) \
T (DATA_TYPE, float, uint64_t)
/* Apply T to every type combination under test: the TEST32 combinations
   with data types int32_t, uint32_t and float, followed by the TEST64
   combinations with data types int64_t, uint64_t and double. */
#define TEST_ALL(T) \
TEST32 (T, int32_t) \
TEST32 (T, uint32_t) \
TEST32 (T, float) \
TEST64 (T, int64_t) \
TEST64 (T, uint64_t) \
TEST64 (T, double)
/* Emit the test functions: TEST_ALL has six rows and each of them expands
   to six TEST_LOOP instances, giving 36 function definitions in total. */
TEST_ALL (TEST_LOOP)
/* { dg-final { scan-assembler-times {\tld1h\tz[0-9]+\.h, p[0-7]/z, \[x[0-9]+, x[0-9]+, lsl 1\]\n} 36 } } */
/* { dg-final { scan-assembler-times {\tcmpeq\tp[0-7]\.h, p[0-7]/z, z[0-9]+\.h, z[0-9]+\.h\n} 12 } } */
/* { dg-final { scan-assembler-times {\tfcmeq\tp[0-7]\.h, p[0-7]/z, z[0-9]+\.h, z[0-9]+\.h\n} 6 } } */
/* { dg-final { scan-assembler-times {\tld1w\tz[0-9]+\.s, p[0-7]/z, \[x[0-9]+, z[0-9]+\.s, sxtw 2\]\n} 18 } } */
/* { dg-final { scan-assembler-times {\tld1w\tz[0-9]+\.s, p[0-7]/z, \[x[0-9]+, z[0-9]+\.s, uxtw 2\]\n} 18 } } */
/* The contiguous ld1w pattern below is also used for the TEST32 indices. */
/* { dg-final { scan-assembler-times {\tld1w\tz[0-9]+\.s, p[0-7]/z, \[x[0-9]+, x[0-9]+, lsl 2\]\n} 72 } } */
/* { dg-final { scan-assembler-times {\tcmpeq\tp[0-7]\.s, p[0-7]/z, z[0-9]+\.s, z[0-9]+\.s\n} 12 } } */
/* { dg-final { scan-assembler-times {\tfcmeq\tp[0-7]\.s, p[0-7]/z, z[0-9]+\.s, z[0-9]+\.s\n} 6 } } */
/* { dg-final { scan-assembler-times {\tld1d\tz[0-9]+\.d, p[0-7]/z, \[x[0-9]+, z[0-9]+\.d, lsl 3\]\n} 36 } } */