| /* { dg-do run } */ |
| /* { dg-options "-O2 -mavx512ifma" } */ |
| /* { dg-require-effective-target avx512ifma } */ |
| |
| #define AVX512IFMA |
| |
| #include "avx512f-helper.h" |
| |
| #define SIZE (AVX512F_LEN / 64) |
| #include "avx512f-mask-type.h" |
| |
| void |
| CALC (long long *r, long long *s1, long long *s2, long long *s3) |
| { |
| int i; |
| long long a, b; |
| |
| for (i = 0; i < SIZE; i++) |
| { |
| /* Simulate higher 52 bits out of 104 bit, |
| by shifting opernads with 0 in lower 26 bits. */ |
| a = s2[i] >> 26; |
| b = s3[i] >> 26; |
| r[i] = a * b + s1[i]; |
| } |
| } |
| |
| void |
| TEST (void) |
| { |
| UNION_TYPE (AVX512F_LEN, i_q) src1, src2, dst1, dst2, dst3; |
| long long dst_ref[SIZE]; |
| int i; |
| MASK_TYPE mask = MASK_VALUE; |
| |
| for (i = 0; i < SIZE; i++) |
| { |
| src1.a[i] = 15 + 3467 * i; |
| src2.a[i] = 9217 + i; |
| src1.a[i] = src1.a[i] << 26; |
| src1.a[i] = src1.a[i] << 26; |
| src1.a[i] &= ((1LL << 52) - 1); |
| src2.a[i] &= ((1LL << 52) - 1); |
| dst1.a[i] = DEFAULT_VALUE; |
| dst2.a[i] = DEFAULT_VALUE; |
| dst3.a[i] = DEFAULT_VALUE; |
| } |
| |
| CALC (dst_ref, dst1.a, src1.a, src2.a); |
| dst1.x = INTRINSIC (_madd52hi_epu64) (dst1.x, src1.x, src2.x); |
| dst2.x = INTRINSIC (_mask_madd52hi_epu64) (dst2.x, mask, src1.x, src2.x); |
| dst3.x = INTRINSIC (_maskz_madd52hi_epu64) (mask, dst3.x, src1.x, src2.x); |
| |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst1, dst_ref)) |
| abort (); |
| |
| MASK_MERGE (i_q) (dst_ref, mask, SIZE); |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst2, dst_ref)) |
| abort (); |
| |
| MASK_ZERO (i_q) (dst_ref, mask, SIZE); |
| if (UNION_CHECK (AVX512F_LEN, i_q) (dst3, dst_ref)) |
| abort (); |
| } |