/* blob: fad298aaf4c9232a674434dc3a77ef3588fc968d [file] [log] [blame] */
/* { dg-do run } */
/* { dg-options "-O2 -mavx512f" } */
/* { dg-require-effective-target avx512f } */
#include "avx512f-check.h"
#include "avx512f-helper.h"
#define SIZE (128 / 64)
#include "avx512f-mask-type.h"
/* Run-time check of the masked scalar-double intrinsics
   _mm_mask_load_sd, _mm_maskz_load_sd, _mm_mask_move_sd,
   _mm_maskz_move_sd and _mm_mask_store_sd.

   Every intrinsic is exercised twice: first with mask == 5 (bit 0 set),
   then with mask == 4 (bit 0 clear).  Each result is compared against a
   hand-built reference vector; any mismatch calls abort ().  */
void
avx512f_test (void)
{
  int i;
  union128d res1, res2, res3, res4, src1, src2, src3;
  /* NOTE(review): mask and p are volatile presumably so the compiler
     cannot fold the intrinsics at -O2 -- confirm.  */
  volatile __mmask8 mask = 5;
  double val[2] = { 35.5, 0.0 };
  double *volatile p = &val[0];
  double res_ref[SIZE];
  double zero[SIZE];

  /* Give every source vector distinct element values so that a result
     taken from the wrong operand is detectable.  */
  for (i = 0; i < SIZE; i++)
    {
      src1.a[i] = 1.5 + i;
      src2.a[i] = 7.5 + i;
      src3.a[i] = 4.5 + i;
      zero[i] = 0.0;
    }

  /* ---- Phase 1: mask == 5, bit 0 is set.  ---- */

  res1.x = _mm_mask_load_sd (src1.x, mask, p);
  res2.x = _mm_maskz_load_sd (mask, p);

  /* Expected for both loads: element 0 comes from memory (val[0]),
     element 1 is zero.  */
  __builtin_memcpy (res_ref, zero, sizeof (zero));
  res_ref[0] = val[0];
  if (check_union128d (res1, res_ref))
    abort ();
  if (check_union128d (res2, res_ref))
    abort ();

  res3.x = _mm_mask_move_sd (src1.x, mask, src2.x, src3.x);
  res4.x = _mm_maskz_move_sd (mask, src2.x, src3.x);

  /* Expected for both moves: element 0 comes from src3, element 1 is
     copied from src2.  */
  __builtin_memcpy (res_ref, src2.a, sizeof (src2.a));
  res_ref[0] = src3.a[0];
  if (check_union128d (res3, res_ref))
    abort ();
  if (check_union128d (res4, res_ref))
    abort ();

  /* With bit 0 set the store must write src1's element 0 to val[1].  */
  _mm_mask_store_sd (p + 1, mask, src1.x);
  if (val[1] != src1.a[0])
    abort ();

  /* ---- Phase 2: clear bit 0, mask == 4.  ---- */
  mask ^= 1;

  res1.x = _mm_mask_load_sd (src1.x, mask, p);
  res2.x = _mm_maskz_load_sd (mask, p);

  /* Merge-masked load: element 0 falls back to src1; element 1 is zero.  */
  __builtin_memcpy (res_ref, zero, sizeof (zero));
  res_ref[0] = src1.a[0];
  if (check_union128d (res1, res_ref))
    abort ();

  /* Zero-masked load: the whole result is zero.  */
  res_ref[0] = zero[0];
  if (check_union128d (res2, res_ref))
    abort ();

  res3.x = _mm_mask_move_sd (src1.x, mask, src2.x, src3.x);
  res4.x = _mm_maskz_move_sd (mask, src2.x, src3.x);

  /* Merge-masked move: element 0 falls back to src1; element 1 is still
     copied from src2.  */
  __builtin_memcpy (res_ref, src2.a, sizeof (src2.a));
  res_ref[0] = src1.a[0];
  if (check_union128d (res3, res_ref))
    abort ();

  /* Zero-masked move: element 0 is zero; element 1 is still from src2.  */
  res_ref[0] = zero[0];
  if (check_union128d (res4, res_ref))
    abort ();

  /* With bit 0 clear the store must leave memory untouched; 42.0 is a
     sentinel that differs from src1.a[0].  */
  val[1] = 42.0;
  _mm_mask_store_sd (p + 1, mask, src1.x);
  if (val[1] != 42.0)
    abort ();
}