blob: 3ee3b03e2510ae8377905d9dea56bbabc2a8906b [file] [log] [blame]
/* { dg-do run } */
/* { dg-options "-O3 --save-temps" } */
#include <arm_neon.h>
extern void abort (void);
extern float fabsf (float);
extern double fabs (double);
#define NUM_TESTS 8
float input_s1[] = {0.1f, -0.1f, 0.4f, 10.3f, 200.0f, -800.0f, -13.0f, -0.5f};
float input_s2[] = {-0.2f, 0.4f, 0.04f, -100.3f, 2.0f, -80.0f, 13.0f, -0.5f};
double input_d1[] = {0.1, -0.1, 0.4, 10.3, 200.0, -800.0, -13.0, -0.5};
double input_d2[] = {-0.2, 0.4, 0.04, -100.3, 2.0, -80.0, 13.0, -0.5};
#define TEST(T, CMP, SUFFIX, WIDTH, LANES, Q, F) \
int \
test_vca##T##_float##WIDTH##x##LANES##_t (void) \
{ \
int ret = 0; \
int i = 0; \
uint##WIDTH##_t output[NUM_TESTS]; \
\
for (i = 0; i < NUM_TESTS; i++) \
{ \
float##WIDTH##_t f1 = fabs##F (input_##SUFFIX##1[i]); \
float##WIDTH##_t f2 = fabs##F (input_##SUFFIX##2[i]); \
/* Inhibit optimization of our linear test loop. */ \
asm volatile ("" : : : "memory"); \
output[i] = f1 CMP f2 ? -1 : 0; \
} \
\
for (i = 0; i < NUM_TESTS; i += LANES) \
{ \
float##WIDTH##x##LANES##_t in1 = \
vld1##Q##_f##WIDTH (input_##SUFFIX##1 + i); \
float##WIDTH##x##LANES##_t in2 = \
vld1##Q##_f##WIDTH (input_##SUFFIX##2 + i); \
uint##WIDTH##x##LANES##_t expected_out = \
vld1##Q##_u##WIDTH (output + i); \
uint##WIDTH##x##LANES##_t out = \
veor##Q##_u##WIDTH (vca##T##Q##_f##WIDTH (in1, in2), \
expected_out); \
vst1##Q##_u##WIDTH (output + i, out); \
} \
\
for (i = 0; i < NUM_TESTS; i++) \
ret |= output[i]; \
\
return ret; \
}
#define BUILD_VARIANTS(T, CMP) \
TEST (T, CMP, s, 32, 2, , f) \
TEST (T, CMP, s, 32, 4, q, f) \
TEST (T, CMP, d, 64, 2, q, )
BUILD_VARIANTS (ge, >=)
/* { dg-final { scan-assembler "facge\\tv\[0-9\]+\.2s, v\[0-9\]+\.2s, v\[0-9\]+\.2s" } } */
/* { dg-final { scan-assembler "facge\\tv\[0-9\]+\.4s, v\[0-9\]+\.4s, v\[0-9\]+\.4s" } } */
/* { dg-final { scan-assembler "facge\\tv\[0-9\]+\.2d, v\[0-9\]+\.2d, v\[0-9\]+\.2d" } } */
BUILD_VARIANTS (gt, >)
/* { dg-final { scan-assembler "facgt\\tv\[0-9\]+\.2s, v\[0-9\]+\.2s, v\[0-9\]+\.2s" } } */
/* { dg-final { scan-assembler "facgt\\tv\[0-9\]+\.4s, v\[0-9\]+\.4s, v\[0-9\]+\.4s" } } */
/* { dg-final { scan-assembler "facgt\\tv\[0-9\]+\.2d, v\[0-9\]+\.2d, v\[0-9\]+\.2d" } } */
/* No need for another scan-assembler as these tests
also generate facge, facgt instructions. */
BUILD_VARIANTS (le, <=)
BUILD_VARIANTS (lt, <)
#undef TEST
#define TEST(T, CMP, SUFFIX, WIDTH, LANES, Q, F) \
if (test_vca##T##_float##WIDTH##x##LANES##_t ()) \
abort ();
int
main (int argc, char **argv)
{
BUILD_VARIANTS (ge, >=)
BUILD_VARIANTS (gt, >)
BUILD_VARIANTS (le, <=)
BUILD_VARIANTS (lt, <)
return 0;
}