| #include <arm_neon.h> |
| #include "arm-neon-ref.h" |
| #include "compute-ref-data.h" |
| #include <math.h> |
| |
| /* Additional expected-result arrays used by the test body below. |
| They are only declared here: each test file is expected to define and |
| initialize them. All of them are declared with 'uint' as the type |
| argument, including the float and p8 ones. |
| NOTE(review): expected_p8 and expected_q_p8 are not referenced by the |
| visible test body; presumably they are meant for EXTRA_TESTS - confirm. */ |
| extern ARRAY(expected_uint, uint, 8, 8); |
| extern ARRAY(expected_uint, uint, 16, 4); |
| extern ARRAY(expected_uint, uint, 32, 2); |
| extern ARRAY(expected_q_uint, uint, 8, 16); |
| extern ARRAY(expected_q_uint, uint, 16, 8); |
| extern ARRAY(expected_q_uint, uint, 32, 4); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| extern ARRAY(expected_float, uint, 16, 4); |
| extern ARRAY(expected_q_float, uint, 16, 8); |
| extern ARRAY(expected_nan, uint, 16, 4); |
| extern ARRAY(expected_mnan, uint, 16, 4); |
| extern ARRAY(expected_nan2, uint, 16, 4); |
| extern ARRAY(expected_inf, uint, 16, 4); |
| extern ARRAY(expected_minf, uint, 16, 4); |
| extern ARRAY(expected_inf2, uint, 16, 4); |
| extern ARRAY(expected_mzero, uint, 16, 4); |
| #endif /* __ARM_FEATURE_FP16_VECTOR_ARITHMETIC */ |
| extern ARRAY(expected_float, uint, 32, 2); |
| extern ARRAY(expected_q_float, uint, 32, 4); |
| extern ARRAY(expected_uint2, uint, 32, 2); |
| extern ARRAY(expected_uint3, uint, 32, 2); |
| extern ARRAY(expected_uint4, uint, 32, 2); |
| extern ARRAY(expected_nan, uint, 32, 2); |
| extern ARRAY(expected_mnan, uint, 32, 2); |
| extern ARRAY(expected_nan2, uint, 32, 2); |
| extern ARRAY(expected_inf, uint, 32, 2); |
| extern ARRAY(expected_minf, uint, 32, 2); |
| extern ARRAY(expected_inf2, uint, 32, 2); |
| extern ARRAY(expected_mzero, uint, 32, 2); |
| extern ARRAY(expected_p8, uint, 8, 8); |
| extern ARRAY(expected_q_p8, uint, 8, 16); |
| |
| #define FNNAME1(NAME) exec_ ## NAME /* Paste "exec_" in front of NAME. */ |
| #define FNNAME(NAME) FNNAME1(NAME) /* Extra level so that a macro argument such as INSN_NAME is expanded before the paste. */ |
| |
| void FNNAME (INSN_NAME) (void) |
| { |
| /* Test body for the two-operand vector comparison selected by INSN_NAME: |
| run it on int, uint and float inputs and CHECK each result against the |
| expected arrays. |
| |
| TEST_VCOMP1 is the basic step: y=vcomp(x1,x2) on the 'vector' and |
| 'vector2' variables of input type T1, kept in the T3-typed 'vector_res' |
| variable and then stored into the T3-typed 'result' variable with |
| vst1<Q>_u<W>. */ |
| #define TEST_VCOMP1(INSN, Q, T1, T2, T3, W, N) \ |
| VECT_VAR(vector_res, T3, W, N) = \ |
| INSN##Q##_##T2##W(VECT_VAR(vector, T1, W, N), \ |
| VECT_VAR(vector2, T1, W, N)); \ |
| vst1##Q##_u##W(VECT_VAR(result, T3, W, N), VECT_VAR(vector_res, T3, W, N)) |
| /* TEST_VCOMP adds one level of indirection so that a macro argument such as |
| INSN_NAME is expanded before TEST_VCOMP1 pastes it into the intrinsic name. */ |
| #define TEST_VCOMP(INSN, Q, T1, T2, T3, W, N) \ |
| TEST_VCOMP1(INSN, Q, T1, T2, T3, W, N) |
| |
| /* First operand. No need for 64 bits elements. The 8x8, 16x4 and 32x2 |
| variants come first, then the 8x16, 16x8 and 32x4 (q) variants. */ |
| DECL_VARIABLE(vector, int, 8, 8); |
| DECL_VARIABLE(vector, int, 16, 4); |
| DECL_VARIABLE(vector, int, 32, 2); |
| DECL_VARIABLE(vector, uint, 8, 8); |
| DECL_VARIABLE(vector, uint, 16, 4); |
| DECL_VARIABLE(vector, uint, 32, 2); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| DECL_VARIABLE (vector, float, 16, 4); |
| #endif |
| DECL_VARIABLE(vector, float, 32, 2); |
| DECL_VARIABLE(vector, int, 8, 16); |
| DECL_VARIABLE(vector, int, 16, 8); |
| DECL_VARIABLE(vector, int, 32, 4); |
| DECL_VARIABLE(vector, uint, 8, 16); |
| DECL_VARIABLE(vector, uint, 16, 8); |
| DECL_VARIABLE(vector, uint, 32, 4); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| DECL_VARIABLE (vector, float, 16, 8); |
| #endif |
| DECL_VARIABLE(vector, float, 32, 4); |
| /* Second operand: same set of types as 'vector'. */ |
| DECL_VARIABLE(vector2, int, 8, 8); |
| DECL_VARIABLE(vector2, int, 16, 4); |
| DECL_VARIABLE(vector2, int, 32, 2); |
| DECL_VARIABLE(vector2, uint, 8, 8); |
| DECL_VARIABLE(vector2, uint, 16, 4); |
| DECL_VARIABLE(vector2, uint, 32, 2); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| DECL_VARIABLE (vector2, float, 16, 4); |
| #endif |
| DECL_VARIABLE(vector2, float, 32, 2); |
| DECL_VARIABLE(vector2, int, 8, 16); |
| DECL_VARIABLE(vector2, int, 16, 8); |
| DECL_VARIABLE(vector2, int, 32, 4); |
| DECL_VARIABLE(vector2, uint, 8, 16); |
| DECL_VARIABLE(vector2, uint, 16, 8); |
| DECL_VARIABLE(vector2, uint, 32, 4); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| DECL_VARIABLE (vector2, float, 16, 8); |
| #endif |
| DECL_VARIABLE(vector2, float, 32, 4); |
| /* Comparison results: only uint variants are declared. */ |
| DECL_VARIABLE(vector_res, uint, 8, 8); |
| DECL_VARIABLE(vector_res, uint, 16, 4); |
| DECL_VARIABLE(vector_res, uint, 32, 2); |
| DECL_VARIABLE(vector_res, uint, 8, 16); |
| DECL_VARIABLE(vector_res, uint, 16, 8); |
| DECL_VARIABLE(vector_res, uint, 32, 4); |
| /* clean_results is not defined in the visible code; presumably it resets the 'result' buffers before the run - confirm. */ |
| clean_results (); |
| |
| /* Load the first operand from 'buffer'. There is no 64 bits variant, so |
| the generic initializer is not used and each type is loaded explicitly. */ |
| VLOAD(vector, buffer, , int, s, 8, 8); |
| VLOAD(vector, buffer, , int, s, 16, 4); |
| VLOAD(vector, buffer, , int, s, 32, 2); |
| VLOAD(vector, buffer, , uint, u, 8, 8); |
| VLOAD(vector, buffer, , uint, u, 16, 4); |
| VLOAD(vector, buffer, , uint, u, 32, 2); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| VLOAD (vector, buffer, , float, f, 16, 4); |
| #endif |
| VLOAD(vector, buffer, , float, f, 32, 2); |
| /* Same loads for the q variants. */ |
| VLOAD(vector, buffer, q, int, s, 8, 16); |
| VLOAD(vector, buffer, q, int, s, 16, 8); |
| VLOAD(vector, buffer, q, int, s, 32, 4); |
| VLOAD(vector, buffer, q, uint, u, 8, 16); |
| VLOAD(vector, buffer, q, uint, u, 16, 8); |
| VLOAD(vector, buffer, q, uint, u, 32, 4); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| VLOAD (vector, buffer, q, float, f, 16, 8); |
| #endif |
| VLOAD(vector, buffer, q, float, f, 32, 4); |
| |
| /* Fill the second operand with one arbitrarily chosen value per type; |
| it is what 'vector' is compared against. */ |
| VDUP(vector2, , int, s, 8, 8, -10); |
| VDUP(vector2, , int, s, 16, 4, -14); |
| VDUP(vector2, , int, s, 32, 2, -16); |
| VDUP(vector2, , uint, u, 8, 8, 0xF3); |
| VDUP(vector2, , uint, u, 16, 4, 0xFFF2); |
| VDUP(vector2, , uint, u, 32, 2, 0xFFFFFFF1); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| VDUP (vector2, , float, f, 16, 4, -15.0f); |
| #endif |
| VDUP(vector2, , float, f, 32, 2, -15.0f); |
| /* The q variants use different constants from the ones above. */ |
| VDUP(vector2, q, int, s, 8, 16, -4); |
| VDUP(vector2, q, int, s, 16, 8, -10); |
| VDUP(vector2, q, int, s, 32, 4, -14); |
| VDUP(vector2, q, uint, u, 8, 16, 0xF4); |
| VDUP(vector2, q, uint, u, 16, 8, 0xFFF6); |
| VDUP(vector2, q, uint, u, 32, 4, 0xFFFFFFF2); |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| VDUP (vector2, q, float, f, 16, 8, -14.0f); |
| #endif |
| VDUP(vector2, q, float, f, 32, 4, -14.0f); |
| |
| /* The comparison operators produce only unsigned results, which |
| means that the tests with uint inputs write their results in the |
| same vectors as the int variants, and so do the float tests. As a |
| consequence, each group has to be executed and checked before the |
| next one runs: int first, then uint, then float. |
| NOTE(review): the original comment also listed poly8, but no poly8 |
| comparison is run in the visible code; presumably that is left to |
| EXTRA_TESTS - confirm. */ |
| |
| /* Apply operator named INSN_NAME to the signed inputs. */ |
| TEST_VCOMP(INSN_NAME, , int, s, uint, 8, 8); |
| TEST_VCOMP(INSN_NAME, , int, s, uint, 16, 4); |
| TEST_VCOMP(INSN_NAME, , int, s, uint, 32, 2); |
| TEST_VCOMP(INSN_NAME, q, int, s, uint, 8, 16); |
| TEST_VCOMP(INSN_NAME, q, int, s, uint, 16, 8); |
| TEST_VCOMP(INSN_NAME, q, int, s, uint, 32, 4); |
| /* The signed results are checked against 'expected', which is not declared in the visible code. */ |
| CHECK(TEST_MSG, uint, 8, 8, PRIx8, expected, ""); |
| CHECK(TEST_MSG, uint, 16, 4, PRIx16, expected, ""); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected, ""); |
| CHECK(TEST_MSG, uint, 8, 16, PRIx8, expected, ""); |
| CHECK(TEST_MSG, uint, 16, 8, PRIx16, expected, ""); |
| CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected, ""); |
| |
| /* Now the uint variants, which overwrite the same result vectors. */ |
| TEST_VCOMP(INSN_NAME, , uint, u, uint, 8, 8); |
| TEST_VCOMP(INSN_NAME, , uint, u, uint, 16, 4); |
| TEST_VCOMP(INSN_NAME, , uint, u, uint, 32, 2); |
| TEST_VCOMP(INSN_NAME, q, uint, u, uint, 8, 16); |
| TEST_VCOMP(INSN_NAME, q, uint, u, uint, 16, 8); |
| TEST_VCOMP(INSN_NAME, q, uint, u, uint, 32, 4); |
| |
| CHECK(TEST_MSG, uint, 8, 8, PRIx8, expected_uint, ""); |
| CHECK(TEST_MSG, uint, 16, 4, PRIx16, expected_uint, ""); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint, ""); |
| CHECK(TEST_MSG, uint, 8, 16, PRIx8, expected_q_uint, ""); |
| CHECK(TEST_MSG, uint, 16, 8, PRIx16, expected_q_uint, ""); |
| CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected_q_uint, ""); |
| |
| /* The float variants; each one is checked right after it runs. The |
| 16-bit float tests are only compiled when |
| __ARM_FEATURE_FP16_VECTOR_ARITHMETIC is defined. */ |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_float, ""); |
| #endif |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_float, ""); |
| |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| TEST_VCOMP (INSN_NAME, q, float, f, uint, 16, 8); |
| CHECK (TEST_MSG, uint, 16, 8, PRIx16, expected_q_float, ""); |
| #endif |
| TEST_VCOMP(INSN_NAME, q, float, f, uint, 32, 4); |
| CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected_q_float, ""); |
| |
| /* Some "special" input values to test some corner cases. */ |
| /* Extra tests to have 100% coverage on all the variants: the 32x2 uint, |
| int and float comparisons are run again with a new second operand. */ |
| VDUP(vector2, , uint, u, 32, 2, 0xFFFFFFF0); |
| TEST_VCOMP(INSN_NAME, , uint, u, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint2, "uint 0xfffffff0"); |
| |
| VDUP(vector2, , int, s, 32, 2, -15); |
| TEST_VCOMP(INSN_NAME, , int, s, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint3, "int -15"); |
| |
| VDUP(vector2, , float, f, 32, 2, -16.0f); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint4, "float -16.0f"); |
| |
| |
| /* Extra FP tests with special values (NaN, -NaN, HUGE_VALF, -HUGE_VALF |
| and -0.0). Both operands are overwritten with VDUP before each |
| comparison. The 16-bit float sequence comes first (when available), |
| then the same sequence for 32-bit floats, starting with 1.0 against NaN. |
| NOTE(review): the messages of the nan and nan2 checks, and of the inf |
| and inf2 checks, differ only by a leading space; presumably the message |
| is what identifies a failing check - confirm whether that matters. */ |
| #if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) |
| VDUP (vector, , float, f, 16, 4, 1.0); |
| VDUP (vector2, , float, f, 16, 4, NAN); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_nan, "FP special (NaN)"); |
| /* 1.0 against -NaN. */ |
| VDUP (vector, , float, f, 16, 4, 1.0); |
| VDUP (vector2, , float, f, 16, 4, -NAN); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_mnan, " FP special (-NaN)"); |
| /* NaN as the first operand. */ |
| VDUP (vector, , float, f, 16, 4, NAN); |
| VDUP (vector2, , float, f, 16, 4, 1.0); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_nan2, " FP special (NaN)"); |
| /* 1.0 against HUGE_VALF. */ |
| VDUP (vector, , float, f, 16, 4, 1.0); |
| VDUP (vector2, , float, f, 16, 4, HUGE_VALF); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_inf, " FP special (inf)"); |
| /* 1.0 against -HUGE_VALF. */ |
| VDUP (vector, , float, f, 16, 4, 1.0); |
| VDUP (vector2, , float, f, 16, 4, -HUGE_VALF); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_minf, " FP special (-inf)"); |
| /* HUGE_VALF as the first operand. */ |
| VDUP (vector, , float, f, 16, 4, HUGE_VALF); |
| VDUP (vector2, , float, f, 16, 4, 1.0); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_inf2, " FP special (inf)"); |
| /* -0.0 against 0.0. */ |
| VDUP (vector, , float, f, 16, 4, -0.0); |
| VDUP (vector2, , float, f, 16, 4, 0.0); |
| TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4); |
| CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_mzero, " FP special (-0.0)"); |
| #endif |
| /* Same special-value sequence for 32-bit floats: 1.0 against NaN first. */ |
| VDUP(vector, , float, f, 32, 2, 1.0); |
| VDUP(vector2, , float, f, 32, 2, NAN); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_nan, "FP special (NaN)"); |
| /* 1.0 against -NaN. */ |
| VDUP(vector, , float, f, 32, 2, 1.0); |
| VDUP(vector2, , float, f, 32, 2, -NAN); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_mnan, " FP special (-NaN)"); |
| /* NaN as the first operand. */ |
| VDUP(vector, , float, f, 32, 2, NAN); |
| VDUP(vector2, , float, f, 32, 2, 1.0); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_nan2, " FP special (NaN)"); |
| /* 1.0 against HUGE_VALF. */ |
| VDUP(vector, , float, f, 32, 2, 1.0); |
| VDUP(vector2, , float, f, 32, 2, HUGE_VALF); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_inf, " FP special (inf)"); |
| /* 1.0 against -HUGE_VALF. */ |
| VDUP(vector, , float, f, 32, 2, 1.0); |
| VDUP(vector2, , float, f, 32, 2, -HUGE_VALF); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_minf, " FP special (-inf)"); |
| /* HUGE_VALF as the first operand. */ |
| VDUP(vector, , float, f, 32, 2, HUGE_VALF); |
| VDUP(vector2, , float, f, 32, 2, 1.0); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_inf2, " FP special (inf)"); |
| /* -0.0 against 0.0. */ |
| VDUP(vector, , float, f, 32, 2, -0.0); |
| VDUP(vector2, , float, f, 32, 2, 0.0); |
| TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2); |
| CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_mzero, " FP special (-0.0)"); |
| /* Optional hook: only invoked when EXTRA_TESTS is defined (it is not defined in the visible code). */ |
| #ifdef EXTRA_TESTS |
| EXTRA_TESTS(); |
| #endif |
| } |
| |
| /* Program entry point: call the exec_ function named after INSN_NAME once, then return 0. */ |
| int |
| main (void) |
| { |
| FNNAME (INSN_NAME) (); |
| return 0; |
| } |