| /* { dg-do compile } */ |
| /* { dg-options "-O2 -ftree-vectorize -ffast-math" } */ |
| |
| #include <stdint.h> |
| |
| #define TEST_LOOP(NAME, OUTTYPE, INTYPE, MASKTYPE) \ |
| void __attribute__ ((noinline, noclone)) \ |
| NAME##_4 (OUTTYPE *__restrict dest, INTYPE *__restrict src, \ |
| MASKTYPE *__restrict cond, int n) \ |
| { \ |
| for (int i = 0; i < n; ++i) \ |
| if (cond[i]) \ |
| dest[i] = src[i * 4] + src[i * 4 + 2]; \ |
| } |
| |
| #define TEST2(NAME, OUTTYPE, INTYPE) \ |
| TEST_LOOP (NAME##_i8, OUTTYPE, INTYPE, int8_t) \ |
| TEST_LOOP (NAME##_i16, OUTTYPE, INTYPE, uint16_t) \ |
| TEST_LOOP (NAME##_f32, OUTTYPE, INTYPE, float) \ |
| TEST_LOOP (NAME##_f64, OUTTYPE, INTYPE, double) |
| |
| #define TEST1(NAME, OUTTYPE) \ |
| TEST2 (NAME##_i8, OUTTYPE, int8_t) \ |
| TEST2 (NAME##_i16, OUTTYPE, uint16_t) \ |
| TEST2 (NAME##_i32, OUTTYPE, int32_t) \ |
| TEST2 (NAME##_i64, OUTTYPE, uint64_t) |
| |
| #define TEST(NAME) \ |
| TEST1 (NAME##_i8, int8_t) \ |
| TEST1 (NAME##_i16, uint16_t) \ |
| TEST1 (NAME##_i32, int32_t) \ |
| TEST1 (NAME##_i64, uint64_t) \ |
| TEST2 (NAME##_f16_f16, _Float16, _Float16) \ |
| TEST2 (NAME##_f32_f32, float, float) \ |
| TEST2 (NAME##_f64_f64, double, double) |
| |
| TEST (test) |
| |
| /* { dg-final { scan-assembler-not {\tld4b\t} } } */ |
| /* { dg-final { scan-assembler-not {\tld4h\t} } } */ |
| /* { dg-final { scan-assembler-not {\tld4w\t} } } */ |
| /* { dg-final { scan-assembler-not {\tld4d\t} } } */ |