| /* { dg-do run } */ |
| /* { dg-options "-O2 -mavx512ifma" } */ |
| /* { dg-require-effective-target avx512ifma } */ |
| |
| #define AVX512IFMA |
| |
| #include "avx512f-helper.h" |
| |
| #define SIZE (AVX512F_LEN / 64) |
| #include "avx512f-mask-type.h" |
| |
| /* Scalar reference used to validate the vector results: for each of the |
| SIZE lanes, store s2 * s3 + s1 into r. */ |
| void |
| CALC (unsigned long long *r, unsigned long long *s1, |
| unsigned long long *s2, unsigned long long *s3) |
| { |
| int lane = 0; |
| |
| /* An ordinary 64-bit multiply is a valid model here, because the |
| multiplicands are less than 1 << 26, so each product is below 1 << 52. */ |
| while (lane < SIZE) |
| { |
| unsigned long long product = s2[lane] * s3[lane]; |
| |
| r[lane] = product + s1[lane]; |
| lane++; |
| } |
| } |
| |
| /* Runs the plain, mask and maskz forms of the madd52lo intrinsic on the |
| same inputs and aborts if any result differs from the scalar reference |
| produced by CALC. */ |
| void |
| TEST (void) |
| { |
| MASK_TYPE mask = MASK_VALUE; |
| UNION_TYPE (AVX512F_LEN, i_q) src1, src2, dst1, dst2, dst3; |
| unsigned long long dst_ref[SIZE]; |
| int k = 0; |
| |
| /* Small multiplicands (50.. and 100..); every destination starts out |
| holding DEFAULT_VALUE in all lanes. */ |
| while (k < SIZE) |
| { |
| src1.a[k] = k + 50; |
| src2.a[k] = k + 100; |
| dst1.a[k] = dst2.a[k] = dst3.a[k] = DEFAULT_VALUE; |
| k++; |
| } |
| |
| /* The reference must be computed before dst1 is overwritten below, |
| since it reads dst1's initial contents as the addend. */ |
| CALC (dst_ref, dst1.a, src1.a, src2.a); |
| |
| dst1.x = INTRINSIC (_madd52lo_epu64) (dst1.x, src1.x, src2.x); |
| dst2.x = INTRINSIC (_mask_madd52lo_epu64) (dst2.x, mask, src1.x, src2.x); |
| dst3.x = INTRINSIC (_maskz_madd52lo_epu64) (mask, dst3.x, src1.x, src2.x); |
| |
| /* Unmasked form: compared against the untouched reference. */ |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst1, dst_ref) != 0) |
| { |
| abort (); |
| } |
| |
| /* Mask form: MASK_MERGE adjusts dst_ref in place first (helper macro |
| defined outside this file; presumably it restores the default in |
| lanes the mask leaves unselected -- confirm against the helper). */ |
| MASK_MERGE (i_q) (dst_ref, mask, SIZE); |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst2, dst_ref) != 0) |
| { |
| abort (); |
| } |
| |
| /* Maskz form: MASK_ZERO is applied on top of the already merged |
| reference (presumably clearing the unselected lanes -- confirm |
| against the helper). */ |
| MASK_ZERO (i_q) (dst_ref, mask, SIZE); |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst3, dst_ref) != 0) |
| { |
| abort (); |
| } |
| } |