blob: c019f248d20aa97950095d2141cb370fcb479234 [file] [log] [blame]
/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
#include "test_sve_acle.h"
/*
** abd_f16_m_tied1:
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_m_tied1, svfloat16_t,
z0 = svabd_f16_m (p0, z0, z1),
z0 = svabd_m (p0, z0, z1))
/*
** abd_f16_m_tied2:
** mov (z[0-9]+)\.d, z0\.d
** movprfx z0, z1
** fabd z0\.h, p0/m, z0\.h, \1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_m_tied2, svfloat16_t,
z0 = svabd_f16_m (p0, z1, z0),
z0 = svabd_m (p0, z1, z0))
/*
** abd_f16_m_untied:
** movprfx z0, z1
** fabd z0\.h, p0/m, z0\.h, z2\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_m_untied, svfloat16_t,
z0 = svabd_f16_m (p0, z1, z2),
z0 = svabd_m (p0, z1, z2))
/*
** abd_h4_f16_m_tied1:
** mov (z[0-9]+\.h), h4
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_m_tied1, svfloat16_t, __fp16,
z0 = svabd_n_f16_m (p0, z0, d4),
z0 = svabd_m (p0, z0, d4))
/*
** abd_h4_f16_m_untied:
** mov (z[0-9]+\.h), h4
** movprfx z0, z1
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_m_untied, svfloat16_t, __fp16,
z0 = svabd_n_f16_m (p0, z1, d4),
z0 = svabd_m (p0, z1, d4))
/*
** abd_1_f16_m_tied1:
** fmov (z[0-9]+\.h), #1\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_m_tied1, svfloat16_t,
z0 = svabd_n_f16_m (p0, z0, 1),
z0 = svabd_m (p0, z0, 1))
/*
** abd_1_f16_m_untied: { xfail *-*-* }
** fmov (z[0-9]+\.h), #1\.0(?:e\+0)?
** movprfx z0, z1
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_m_untied, svfloat16_t,
z0 = svabd_n_f16_m (p0, z1, 1),
z0 = svabd_m (p0, z1, 1))
/*
** abd_f16_z_tied1:
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_z_tied1, svfloat16_t,
z0 = svabd_f16_z (p0, z0, z1),
z0 = svabd_z (p0, z0, z1))
/*
** abd_f16_z_tied2:
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_z_tied2, svfloat16_t,
z0 = svabd_f16_z (p0, z1, z0),
z0 = svabd_z (p0, z1, z0))
/*
** abd_f16_z_untied:
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, z2\.h
** |
** movprfx z0\.h, p0/z, z2\.h
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_f16_z_untied, svfloat16_t,
z0 = svabd_f16_z (p0, z1, z2),
z0 = svabd_z (p0, z1, z2))
/*
** abd_h4_f16_z_tied1:
** mov (z[0-9]+\.h), h4
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_z_tied1, svfloat16_t, __fp16,
z0 = svabd_n_f16_z (p0, z0, d4),
z0 = svabd_z (p0, z0, d4))
/*
** abd_h4_f16_z_untied:
** mov (z[0-9]+\.h), h4
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, \1
** |
** movprfx z0\.h, p0/z, \1
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_z_untied, svfloat16_t, __fp16,
z0 = svabd_n_f16_z (p0, z1, d4),
z0 = svabd_z (p0, z1, d4))
/*
** abd_1_f16_z_tied1:
** fmov (z[0-9]+\.h), #1\.0(?:e\+0)?
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_z_tied1, svfloat16_t,
z0 = svabd_n_f16_z (p0, z0, 1),
z0 = svabd_z (p0, z0, 1))
/*
** abd_1_f16_z_untied:
** fmov (z[0-9]+\.h), #1\.0(?:e\+0)?
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, \1
** |
** movprfx z0\.h, p0/z, \1
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_z_untied, svfloat16_t,
z0 = svabd_n_f16_z (p0, z1, 1),
z0 = svabd_z (p0, z1, 1))
/*
** abd_0p5_f16_z_tied1:
** fmov (z[0-9]+\.h), #(?:0\.5|5\.0e-1)
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_0p5_f16_z_tied1, svfloat16_t,
z0 = svabd_n_f16_z (p0, z0, 0.5),
z0 = svabd_z (p0, z0, 0.5))
/*
** abd_0p5_f16_z_untied:
** fmov (z[0-9]+\.h), #(?:0\.5|5\.0e-1)
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, \1
** |
** movprfx z0\.h, p0/z, \1
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_0p5_f16_z_untied, svfloat16_t,
z0 = svabd_n_f16_z (p0, z1, 0.5),
z0 = svabd_z (p0, z1, 0.5))
/*
** abd_m1_f16_z_tied1:
** fmov (z[0-9]+\.h), #-1\.0(?:e\+0)?
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_m1_f16_z_tied1, svfloat16_t,
z0 = svabd_n_f16_z (p0, z0, -1),
z0 = svabd_z (p0, z0, -1))
/*
** abd_m1_f16_z_untied:
** fmov (z[0-9]+\.h), #-1\.0(?:e\+0)?
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, \1
** |
** movprfx z0\.h, p0/z, \1
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_m1_f16_z_untied, svfloat16_t,
z0 = svabd_n_f16_z (p0, z1, -1),
z0 = svabd_z (p0, z1, -1))
/*
** abd_m0p5_f16_z_tied1:
** fmov (z[0-9]+\.h), #-(?:0\.5|5\.0e-1)
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_m0p5_f16_z_tied1, svfloat16_t,
z0 = svabd_n_f16_z (p0, z0, -0.5),
z0 = svabd_z (p0, z0, -0.5))
/*
** abd_m0p5_f16_z_untied:
** fmov (z[0-9]+\.h), #-(?:0\.5|5\.0e-1)
** (
** movprfx z0\.h, p0/z, z1\.h
** fabd z0\.h, p0/m, z0\.h, \1
** |
** movprfx z0\.h, p0/z, \1
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_m0p5_f16_z_untied, svfloat16_t,
z0 = svabd_n_f16_z (p0, z1, -0.5),
z0 = svabd_z (p0, z1, -0.5))
/*
** abd_m2_f16_z:
** fmov (z[0-9]+\.h), #-2\.0(?:e\+0)?
** movprfx z0\.h, p0/z, z0\.h
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_m2_f16_z, svfloat16_t,
z0 = svabd_n_f16_z (p0, z0, -2),
z0 = svabd_z (p0, z0, -2))
/*
** abd_f16_x_tied1:
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_x_tied1, svfloat16_t,
z0 = svabd_f16_x (p0, z0, z1),
z0 = svabd_x (p0, z0, z1))
/*
** abd_f16_x_tied2:
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_f16_x_tied2, svfloat16_t,
z0 = svabd_f16_x (p0, z1, z0),
z0 = svabd_x (p0, z1, z0))
/*
** abd_f16_x_untied:
** (
** movprfx z0, z1
** fabd z0\.h, p0/m, z0\.h, z2\.h
** |
** movprfx z0, z2
** fabd z0\.h, p0/m, z0\.h, z1\.h
** )
** ret
*/
TEST_UNIFORM_Z (abd_f16_x_untied, svfloat16_t,
z0 = svabd_f16_x (p0, z1, z2),
z0 = svabd_x (p0, z1, z2))
/*
** abd_h4_f16_x_tied1:
** mov (z[0-9]+\.h), h4
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_x_tied1, svfloat16_t, __fp16,
z0 = svabd_n_f16_x (p0, z0, d4),
z0 = svabd_x (p0, z0, d4))
/*
** abd_h4_f16_x_untied:
** mov z0\.h, h4
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_ZD (abd_h4_f16_x_untied, svfloat16_t, __fp16,
z0 = svabd_n_f16_x (p0, z1, d4),
z0 = svabd_x (p0, z1, d4))
/*
** abd_1_f16_x_tied1:
** fmov (z[0-9]+\.h), #1\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (p0, z0, 1),
z0 = svabd_x (p0, z0, 1))
/*
** abd_1_f16_x_untied:
** fmov z0\.h, #1\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_1_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (p0, z1, 1),
z0 = svabd_x (p0, z1, 1))
/*
** abd_0p5_f16_x_tied1:
** fmov (z[0-9]+\.h), #(?:0\.5|5\.0e-1)
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_0p5_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (p0, z0, 0.5),
z0 = svabd_x (p0, z0, 0.5))
/*
** abd_0p5_f16_x_untied:
** fmov z0\.h, #(?:0\.5|5\.0e-1)
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_0p5_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (p0, z1, 0.5),
z0 = svabd_x (p0, z1, 0.5))
/*
** abd_m1_f16_x_tied1:
** fmov (z[0-9]+\.h), #-1\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_m1_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (p0, z0, -1),
z0 = svabd_x (p0, z0, -1))
/*
** abd_m1_f16_x_untied:
** fmov z0\.h, #-1\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_m1_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (p0, z1, -1),
z0 = svabd_x (p0, z1, -1))
/*
** abd_m0p5_f16_x_tied1:
** fmov (z[0-9]+\.h), #-(?:0\.5|5\.0e-1)
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_m0p5_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (p0, z0, -0.5),
z0 = svabd_x (p0, z0, -0.5))
/*
** abd_m0p5_f16_x_untied:
** fmov z0\.h, #-(?:0\.5|5\.0e-1)
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_m0p5_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (p0, z1, -0.5),
z0 = svabd_x (p0, z1, -0.5))
/*
** abd_2_f16_x_tied1:
** fmov (z[0-9]+\.h), #2\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, \1
** ret
*/
TEST_UNIFORM_Z (abd_2_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (p0, z0, 2),
z0 = svabd_x (p0, z0, 2))
/*
** abd_2_f16_x_untied:
** fmov z0\.h, #2\.0(?:e\+0)?
** fabd z0\.h, p0/m, z0\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (abd_2_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (p0, z1, 2),
z0 = svabd_x (p0, z1, 2))
/*
** ptrue_abd_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_f16_x_tied1, svfloat16_t,
z0 = svabd_f16_x (svptrue_b16 (), z0, z1),
z0 = svabd_x (svptrue_b16 (), z0, z1))
/*
** ptrue_abd_f16_x_tied2:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_f16_x_tied2, svfloat16_t,
z0 = svabd_f16_x (svptrue_b16 (), z1, z0),
z0 = svabd_x (svptrue_b16 (), z1, z0))
/*
** ptrue_abd_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_f16_x_untied, svfloat16_t,
z0 = svabd_f16_x (svptrue_b16 (), z1, z2),
z0 = svabd_x (svptrue_b16 (), z1, z2))
/*
** ptrue_abd_1_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_1_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z0, 1),
z0 = svabd_x (svptrue_b16 (), z0, 1))
/*
** ptrue_abd_1_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_1_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z1, 1),
z0 = svabd_x (svptrue_b16 (), z1, 1))
/*
** ptrue_abd_0p5_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_0p5_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z0, 0.5),
z0 = svabd_x (svptrue_b16 (), z0, 0.5))
/*
** ptrue_abd_0p5_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_0p5_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z1, 0.5),
z0 = svabd_x (svptrue_b16 (), z1, 0.5))
/*
** ptrue_abd_m1_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_m1_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z0, -1),
z0 = svabd_x (svptrue_b16 (), z0, -1))
/*
** ptrue_abd_m1_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_m1_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z1, -1),
z0 = svabd_x (svptrue_b16 (), z1, -1))
/*
** ptrue_abd_m0p5_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_m0p5_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z0, -0.5),
z0 = svabd_x (svptrue_b16 (), z0, -0.5))
/*
** ptrue_abd_m0p5_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_m0p5_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z1, -0.5),
z0 = svabd_x (svptrue_b16 (), z1, -0.5))
/*
** ptrue_abd_2_f16_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_2_f16_x_tied1, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z0, 2),
z0 = svabd_x (svptrue_b16 (), z0, 2))
/*
** ptrue_abd_2_f16_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_abd_2_f16_x_untied, svfloat16_t,
z0 = svabd_n_f16_x (svptrue_b16 (), z1, 2),
z0 = svabd_x (svptrue_b16 (), z1, 2))