/* aarch64/advsimd-intrinsics/cmp_op.inc */

#include <arm_neon.h>
#include "arm-neon-ref.h"
#include "compute-ref-data.h"
#include <math.h>

/* Reference results used by the checks below.  They are only declared
   here; each test file that includes this template initializes
   them.  */

/* Unsigned-input comparisons, 64-bit then 128-bit vectors.  */
extern ARRAY (expected_uint, uint, 8, 8);
extern ARRAY (expected_uint, uint, 16, 4);
extern ARRAY (expected_uint, uint, 32, 2);
extern ARRAY (expected_q_uint, uint, 8, 16);
extern ARRAY (expected_q_uint, uint, 16, 8);
extern ARRAY (expected_q_uint, uint, 32, 4);

/* Single-precision float comparisons.  */
extern ARRAY (expected_float, uint, 32, 2);
extern ARRAY (expected_q_float, uint, 32, 4);

/* Extra 32-bit cases: uint 0xfffffff0, int -15 and float -16.0f
   respectively.  */
extern ARRAY (expected_uint2, uint, 32, 2);
extern ARRAY (expected_uint3, uint, 32, 2);
extern ARRAY (expected_uint4, uint, 32, 2);

/* Single-precision special values (NaN, -NaN, +/-inf, -0.0).  */
extern ARRAY (expected_nan, uint, 32, 2);
extern ARRAY (expected_mnan, uint, 32, 2);
extern ARRAY (expected_nan2, uint, 32, 2);
extern ARRAY (expected_inf, uint, 32, 2);
extern ARRAY (expected_minf, uint, 32, 2);
extern ARRAY (expected_inf2, uint, 32, 2);
extern ARRAY (expected_mzero, uint, 32, 2);

#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
/* Half-precision counterparts of the float results above.  */
extern ARRAY (expected_float, uint, 16, 4);
extern ARRAY (expected_q_float, uint, 16, 8);
extern ARRAY (expected_nan, uint, 16, 4);
extern ARRAY (expected_mnan, uint, 16, 4);
extern ARRAY (expected_nan2, uint, 16, 4);
extern ARRAY (expected_inf, uint, 16, 4);
extern ARRAY (expected_minf, uint, 16, 4);
extern ARRAY (expected_inf2, uint, 16, 4);
extern ARRAY (expected_mzero, uint, 16, 4);
#endif

/* poly8 results.  Not referenced by the code in this file; presumably
   consumed by the EXTRA_TESTS hook of the including test -- TODO
   confirm.  */
extern ARRAY (expected_p8, uint, 8, 8);
extern ARRAY (expected_q_p8, uint, 8, 16);

/* Build the name of the test function: FNNAME (INSN_NAME) yields
   exec_<insn>.  The extra FNNAME1 level is needed so that the argument
   (e.g. INSN_NAME) is macro-expanded before being pasted with ##.  */
#define FNNAME1(NAME) exec_ ## NAME
#define FNNAME(NAME) FNNAME1(NAME)

/* Test driver for the comparison intrinsic named by INSN_NAME (which,
   like TEST_MSG and the optional EXTRA_TESTS hook, must be defined by
   the file including this one).

   The intrinsic is applied to int, uint and float input vectors, in
   both 64-bit and 128-bit (q) forms, and each result is stored and
   checked against the matching expected_* array.  Float16 variants are
   only exercised when __ARM_FEATURE_FP16_VECTOR_ARITHMETIC is defined.

   DECL_VARIABLE, VECT_VAR, VLOAD, VDUP, CHECK and clean_results are not
   defined in this file; presumably they come from the included test
   headers.  */
void FNNAME (INSN_NAME) (void)
{
  /* Basic test: y=vcomp(x1,x2), then store the result.

     INSN is the intrinsic base name, Q is empty or 'q', T1 is the input
     type name, T2 the type letter used in the intrinsic suffix, T3 the
     result type name, W the element width and N the number of lanes.
     The store always uses the _u<W> variant since the result vector is
     unsigned whatever the input type is.  */
#define TEST_VCOMP1(INSN, Q, T1, T2, T3, W, N)				\
  VECT_VAR(vector_res, T3, W, N) =					\
    INSN##Q##_##T2##W(VECT_VAR(vector, T1, W, N),			\
		      VECT_VAR(vector2, T1, W, N));			\
  vst1##Q##_u##W(VECT_VAR(result, T3, W, N), VECT_VAR(vector_res, T3, W, N))

  /* Extra level of indirection so that macro arguments such as
     INSN_NAME are expanded before TEST_VCOMP1 pastes them.  */
#define TEST_VCOMP(INSN, Q, T1, T2, T3, W, N)				\
  TEST_VCOMP1(INSN, Q, T1, T2, T3, W, N)

  /* First operand of the comparisons.
     No need for 64 bits elements.  */
  DECL_VARIABLE(vector, int, 8, 8);
  DECL_VARIABLE(vector, int, 16, 4);
  DECL_VARIABLE(vector, int, 32, 2);
  DECL_VARIABLE(vector, uint, 8, 8);
  DECL_VARIABLE(vector, uint, 16, 4);
  DECL_VARIABLE(vector, uint, 32, 2);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  DECL_VARIABLE (vector, float, 16, 4);
#endif
  DECL_VARIABLE(vector, float, 32, 2);
  DECL_VARIABLE(vector, int, 8, 16);
  DECL_VARIABLE(vector, int, 16, 8);
  DECL_VARIABLE(vector, int, 32, 4);
  DECL_VARIABLE(vector, uint, 8, 16);
  DECL_VARIABLE(vector, uint, 16, 8);
  DECL_VARIABLE(vector, uint, 32, 4);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  DECL_VARIABLE (vector, float, 16, 8);
#endif
  DECL_VARIABLE(vector, float, 32, 4);

  /* Second operand of the comparisons, same set of types.  */
  DECL_VARIABLE(vector2, int, 8, 8);
  DECL_VARIABLE(vector2, int, 16, 4);
  DECL_VARIABLE(vector2, int, 32, 2);
  DECL_VARIABLE(vector2, uint, 8, 8);
  DECL_VARIABLE(vector2, uint, 16, 4);
  DECL_VARIABLE(vector2, uint, 32, 2);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  DECL_VARIABLE (vector2, float, 16, 4);
#endif
  DECL_VARIABLE(vector2, float, 32, 2);
  DECL_VARIABLE(vector2, int, 8, 16);
  DECL_VARIABLE(vector2, int, 16, 8);
  DECL_VARIABLE(vector2, int, 32, 4);
  DECL_VARIABLE(vector2, uint, 8, 16);
  DECL_VARIABLE(vector2, uint, 16, 8);
  DECL_VARIABLE(vector2, uint, 32, 4);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  DECL_VARIABLE (vector2, float, 16, 8);
#endif
  DECL_VARIABLE(vector2, float, 32, 4);

  /* Results: only unsigned vectors are needed, they are shared by the
     int, uint and float input variants of the same width.  */
  DECL_VARIABLE(vector_res, uint, 8, 8);
  DECL_VARIABLE(vector_res, uint, 16, 4);
  DECL_VARIABLE(vector_res, uint, 32, 2);
  DECL_VARIABLE(vector_res, uint, 8, 16);
  DECL_VARIABLE(vector_res, uint, 16, 8);
  DECL_VARIABLE(vector_res, uint, 32, 4);

  /* Helper defined outside this file; presumably resets the result
     buffers before the tests run.  */
  clean_results ();

  /* Initialize the first operand from 'buffer'.
     There is no 64 bits variant, don't use the generic initializer.  */
  VLOAD(vector, buffer, , int, s, 8, 8);
  VLOAD(vector, buffer, , int, s, 16, 4);
  VLOAD(vector, buffer, , int, s, 32, 2);
  VLOAD(vector, buffer, , uint, u, 8, 8);
  VLOAD(vector, buffer, , uint, u, 16, 4);
  VLOAD(vector, buffer, , uint, u, 32, 2);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  VLOAD (vector, buffer, , float, f, 16, 4);
#endif
  VLOAD(vector, buffer, , float, f, 32, 2);

  VLOAD(vector, buffer, q, int, s, 8, 16);
  VLOAD(vector, buffer, q, int, s, 16, 8);
  VLOAD(vector, buffer, q, int, s, 32, 4);
  VLOAD(vector, buffer, q, uint, u, 8, 16);
  VLOAD(vector, buffer, q, uint, u, 16, 8);
  VLOAD(vector, buffer, q, uint, u, 32, 4);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  VLOAD (vector, buffer, q, float, f, 16, 8);
#endif
  VLOAD(vector, buffer, q, float, f, 32, 4);

  /* Choose init value arbitrarily, will be used for vector
     comparison.  */
  VDUP(vector2, , int, s, 8, 8, -10);
  VDUP(vector2, , int, s, 16, 4, -14);
  VDUP(vector2, , int, s, 32, 2, -16);
  VDUP(vector2, , uint, u, 8, 8, 0xF3);
  VDUP(vector2, , uint, u, 16, 4, 0xFFF2);
  VDUP(vector2, , uint, u, 32, 2, 0xFFFFFFF1);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  VDUP (vector2, , float, f, 16, 4, -15.0f);
#endif
  VDUP(vector2, , float, f, 32, 2, -15.0f);

  VDUP(vector2, q, int, s, 8, 16, -4);
  VDUP(vector2, q, int, s, 16, 8, -10);
  VDUP(vector2, q, int, s, 32, 4, -14);
  VDUP(vector2, q, uint, u, 8, 16, 0xF4);
  VDUP(vector2, q, uint, u, 16, 8, 0xFFF6);
  VDUP(vector2, q, uint, u, 32, 4, 0xFFFFFFF2);
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  VDUP (vector2, q, float, f, 16, 8, -14.0f);
#endif
  VDUP(vector2, q, float, f, 32, 4, -14.0f);

  /* The comparison operators produce only unsigned results, which
     means that our tests with uint* inputs write their results in the
     same vectors as the int* variants.  As a consequence, we have to
     execute and test the int* first, then the uint* ones.
     Same thing for float and poly8.

     Do not reorder the TEST_VCOMP/CHECK groups below: each CHECK must
     run before the next TEST_VCOMP of the same width overwrites the
     shared result.  */

  /* Apply operator named INSN_NAME.  */
  TEST_VCOMP(INSN_NAME, , int, s, uint, 8, 8);
  TEST_VCOMP(INSN_NAME, , int, s, uint, 16, 4);
  TEST_VCOMP(INSN_NAME, , int, s, uint, 32, 2);
  TEST_VCOMP(INSN_NAME, q, int, s, uint, 8, 16);
  TEST_VCOMP(INSN_NAME, q, int, s, uint, 16, 8);
  TEST_VCOMP(INSN_NAME, q, int, s, uint, 32, 4);

  /* Results of the int* variants are checked against 'expected'.  */
  CHECK(TEST_MSG, uint, 8, 8, PRIx8, expected, "");
  CHECK(TEST_MSG, uint, 16, 4, PRIx16, expected, "");
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected, "");
  CHECK(TEST_MSG, uint, 8, 16, PRIx8, expected, "");
  CHECK(TEST_MSG, uint, 16, 8, PRIx16, expected, "");
  CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected, "");

  /* Now the uint* variants.  */
  TEST_VCOMP(INSN_NAME, , uint, u, uint, 8, 8);
  TEST_VCOMP(INSN_NAME, , uint, u, uint, 16, 4);
  TEST_VCOMP(INSN_NAME, , uint, u, uint, 32, 2);
  TEST_VCOMP(INSN_NAME, q, uint, u, uint, 8, 16);
  TEST_VCOMP(INSN_NAME, q, uint, u, uint, 16, 8);
  TEST_VCOMP(INSN_NAME, q, uint, u, uint, 32, 4);

  CHECK(TEST_MSG, uint, 8, 8, PRIx8, expected_uint, "");
  CHECK(TEST_MSG, uint, 16, 4, PRIx16, expected_uint, "");
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint, "");
  CHECK(TEST_MSG, uint, 8, 16, PRIx8, expected_q_uint, "");
  CHECK(TEST_MSG, uint, 16, 8, PRIx16, expected_q_uint, "");
  CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected_q_uint, "");

  /* The float variants.  Each one is checked right after being
     computed.  */
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_float, "");
#endif
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_float, "");

#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  TEST_VCOMP (INSN_NAME, q, float, f, uint, 16, 8);
  CHECK (TEST_MSG, uint, 16, 8, PRIx16, expected_q_float, "");
#endif
  TEST_VCOMP(INSN_NAME, q, float, f, uint, 32, 4);
  CHECK(TEST_MSG, uint, 32, 4, PRIx32, expected_q_float, "");

  /* Some "special" input values to test some corner cases.  */
  /* Extra tests to have 100% coverage on all the variants.
     Only the second operand is changed; 'vector' still holds the
     values loaded from 'buffer'.  */
  VDUP(vector2, , uint, u, 32, 2, 0xFFFFFFF0);
  TEST_VCOMP(INSN_NAME, , uint, u, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint2, "uint 0xfffffff0");

  VDUP(vector2, , int, s, 32, 2, -15);
  TEST_VCOMP(INSN_NAME, , int, s, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint3, "int -15");

  VDUP(vector2, , float, f, 32, 2, -16.0f);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_uint4, "float -16.0f");


  /* Extra FP tests with special values (NaN, ....).
     Both operands are overwritten for each case.  */
#if defined (__ARM_FEATURE_FP16_VECTOR_ARITHMETIC)
  /* Half-precision: 1.0 vs NaN.  */
  VDUP (vector, , float, f, 16, 4, 1.0);
  VDUP (vector2, , float, f, 16, 4, NAN);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_nan, "FP special (NaN)");

  /* 1.0 vs -NaN.  */
  VDUP (vector, , float, f, 16, 4, 1.0);
  VDUP (vector2, , float, f, 16, 4, -NAN);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_mnan, " FP special (-NaN)");

  /* NaN vs 1.0 (operands swapped).  */
  VDUP (vector, , float, f, 16, 4, NAN);
  VDUP (vector2, , float, f, 16, 4, 1.0);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_nan2, " FP special (NaN)");

  /* 1.0 vs +inf.  */
  VDUP (vector, , float, f, 16, 4, 1.0);
  VDUP (vector2, , float, f, 16, 4, HUGE_VALF);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_inf, " FP special (inf)");

  /* 1.0 vs -inf.  */
  VDUP (vector, , float, f, 16, 4, 1.0);
  VDUP (vector2, , float, f, 16, 4, -HUGE_VALF);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_minf, " FP special (-inf)");

  /* +inf vs 1.0 (operands swapped).  */
  VDUP (vector, , float, f, 16, 4, HUGE_VALF);
  VDUP (vector2, , float, f, 16, 4, 1.0);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_inf2, " FP special (inf)");

  /* -0.0 vs 0.0.  */
  VDUP (vector, , float, f, 16, 4, -0.0);
  VDUP (vector2, , float, f, 16, 4, 0.0);
  TEST_VCOMP (INSN_NAME, , float, f, uint, 16, 4);
  CHECK (TEST_MSG, uint, 16, 4, PRIx16, expected_mzero, " FP special (-0.0)");
#endif

  /* Single-precision: same sequence of special-value cases.  */
  /* 1.0 vs NaN.  */
  VDUP(vector, , float, f, 32, 2, 1.0);
  VDUP(vector2, , float, f, 32, 2, NAN);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_nan, "FP special (NaN)");

  /* 1.0 vs -NaN.  */
  VDUP(vector, , float, f, 32, 2, 1.0);
  VDUP(vector2, , float, f, 32, 2, -NAN);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_mnan, " FP special (-NaN)");

  /* NaN vs 1.0 (operands swapped).  */
  VDUP(vector, , float, f, 32, 2, NAN);
  VDUP(vector2, , float, f, 32, 2, 1.0);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_nan2, " FP special (NaN)");

  /* 1.0 vs +inf.  */
  VDUP(vector, , float, f, 32, 2, 1.0);
  VDUP(vector2, , float, f, 32, 2, HUGE_VALF);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_inf, " FP special (inf)");

  /* 1.0 vs -inf.  */
  VDUP(vector, , float, f, 32, 2, 1.0);
  VDUP(vector2, , float, f, 32, 2, -HUGE_VALF);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_minf, " FP special (-inf)");

  /* +inf vs 1.0 (operands swapped).  */
  VDUP(vector, , float, f, 32, 2, HUGE_VALF);
  VDUP(vector2, , float, f, 32, 2, 1.0);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_inf2, " FP special (inf)");

  /* -0.0 vs 0.0.  */
  VDUP(vector, , float, f, 32, 2, -0.0);
  VDUP(vector2, , float, f, 32, 2, 0.0);
  TEST_VCOMP(INSN_NAME, , float, f, uint, 32, 2);
  CHECK(TEST_MSG, uint, 32, 2, PRIx32, expected_mzero, " FP special (-0.0)");

  /* Optional hook: when the including file defines EXTRA_TESTS, call it
     as a function taking no argument.  */
#ifdef EXTRA_TESTS
  EXTRA_TESTS();
#endif
}

/* Program entry point: run the test function generated for INSN_NAME
   (exec_<insn>), then return 0.  */
int
main (void)
{
  FNNAME (INSN_NAME) ();
  return 0;
}