/* Source blob: fa1c19b9f6bdbd405285ac8d2f30111307ba8dcf */
/* { dg-do run } */
/* { dg-require-effective-target avx512er } */
/* { dg-options "-O2 -mavx512er" } */
#include "avx512er-check.h"
#include "avx512f-mask-type.h"
#include "avx512f-helper.h"
#include <math.h>
#define IMM 0x23
/* Run the scalar single-precision rsqrt28 intrinsics in their rounded,
   merge-masked and zero-masked forms, and abort () if any result differs
   from a reference built with 1.0 / sqrt ().

   The reference holds 1.0 / sqrt (operand[0]) in element 0 and the
   pass-through values in elements 1..3.  */
static void
avx512er_test (void)
{
  /* Rounding immediate shared by the two masked explicit-rounding calls;
     an enum constant keeps it an integer constant expression.  */
  enum { ROUND_NEAREST_NO_EXC = _MM_FROUND_TO_NEAREST_INT | _MM_FROUND_NO_EXC };

  union128 passthru, operand;
  union128 out_round, out_merge, out_merge_round, out_zero, out_zero_round;
  float expected[4];
  /* NOTE(review): the reference is masked with MASK_VALUE while the
     intrinsics below receive IMM; presumably bit 0 of both must agree --
     confirm against the mask-type header.  */
  MASK_TYPE mask = MASK_VALUE;
  int lane;

  /* Fill both inputs; the reference starts out as a copy of the
     pass-through vector.  */
  for (lane = 0; lane < 4; lane++)
    {
      expected[lane] = passthru.a[lane] = 179.345 - 6.5645 * lane;
      operand.a[lane] = 179221345 + 6.5645 * lane;
    }

  /* Only element 0 of the reference carries the computed value.  */
  expected[0] = 1.0 / sqrt (operand.a[0]);

  out_round.x = _mm_rsqrt28_round_ss (passthru.x, operand.x,
				      _MM_FROUND_NO_EXC);
  out_merge.x = _mm_mask_rsqrt28_ss (passthru.x, IMM, passthru.x, operand.x);
  out_merge_round.x = _mm_mask_rsqrt28_round_ss (passthru.x, IMM, passthru.x,
						 operand.x,
						 ROUND_NEAREST_NO_EXC);
  out_zero.x = _mm_maskz_rsqrt28_ss (IMM, passthru.x, operand.x);
  out_zero_round.x = _mm_maskz_rsqrt28_round_ss (IMM, passthru.x, operand.x,
						 ROUND_NEAREST_NO_EXC);

  /* Unmasked form: all four elements are compared.  */
  if (checkVf (out_round.a, expected, 4))
    abort ();

  /* Merge-masked forms: apply merge masking to element 0 of the reference,
     then compare the first two elements.  */
  MASK_MERGE () (expected, mask, 1);
  if (checkVf (out_merge.a, expected, 2)
      || checkVf (out_merge_round.a, expected, 2))
    abort ();

  /* Zero-masked forms: apply zero masking to element 0 of the reference,
     then compare the first two elements.  */
  MASK_ZERO () (expected, mask, 1);
  if (checkVf (out_zero.a, expected, 2)
      || checkVf (out_zero_round.a, expected, 2))
    abort ();
}