blob: d865618d4659c49188b40213e29c9a2e1b4f50a0 [file] [log] [blame]
/* { dg-additional-options "-fno-trapping-math" } */
/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
#include "test_sve_acle.h"
/*
** mul_f64_m_tied1:
** fmul z0\.d, p0/m, z0\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (mul_f64_m_tied1, svfloat64_t,
z0 = svmul_f64_m (p0, z0, z1),
z0 = svmul_m (p0, z0, z1))
/*
** mul_f64_m_tied2:
** mov (z[0-9]+\.d), z0\.d
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_Z (mul_f64_m_tied2, svfloat64_t,
z0 = svmul_f64_m (p0, z1, z0),
z0 = svmul_m (p0, z1, z0))
/*
** mul_f64_m_untied:
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, z2\.d
** ret
*/
TEST_UNIFORM_Z (mul_f64_m_untied, svfloat64_t,
z0 = svmul_f64_m (p0, z1, z2),
z0 = svmul_m (p0, z1, z2))
/*
** mul_d4_f64_m_tied1:
** mov (z[0-9]+\.d), d4
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_m_tied1, svfloat64_t, double,
z0 = svmul_n_f64_m (p0, z0, d4),
z0 = svmul_m (p0, z0, d4))
/*
** mul_d4_f64_m_untied:
** mov (z[0-9]+\.d), d4
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_m_untied, svfloat64_t, double,
z0 = svmul_n_f64_m (p0, z1, d4),
z0 = svmul_m (p0, z1, d4))
/*
** mul_1_f64_m_tied1:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_m_tied1, svfloat64_t,
z0 = svmul_n_f64_m (p0, z0, 1),
z0 = svmul_m (p0, z0, 1))
/*
** mul_1_f64_m_untied: { xfail *-*-* }
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_m_untied, svfloat64_t,
z0 = svmul_n_f64_m (p0, z1, 1),
z0 = svmul_m (p0, z1, 1))
/*
** mul_0p5_f64_m_tied1:
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_m_tied1, svfloat64_t,
z0 = svmul_n_f64_m (p0, z0, 0.5),
z0 = svmul_m (p0, z0, 0.5))
/*
** mul_0p5_f64_m_untied:
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_m_untied, svfloat64_t,
z0 = svmul_n_f64_m (p0, z1, 0.5),
z0 = svmul_m (p0, z1, 0.5))
/*
** mul_2_f64_m_tied1:
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_m_tied1, svfloat64_t,
z0 = svmul_n_f64_m (p0, z0, 2),
z0 = svmul_m (p0, z0, 2))
/*
** mul_2_f64_m_untied:
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_m_untied, svfloat64_t,
z0 = svmul_n_f64_m (p0, z1, 2),
z0 = svmul_m (p0, z1, 2))
/*
** mul_f64_z_tied1:
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (mul_f64_z_tied1, svfloat64_t,
z0 = svmul_f64_z (p0, z0, z1),
z0 = svmul_z (p0, z0, z1))
/*
** mul_f64_z_tied2:
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (mul_f64_z_tied2, svfloat64_t,
z0 = svmul_f64_z (p0, z1, z0),
z0 = svmul_z (p0, z1, z0))
/*
** mul_f64_z_untied:
** (
** movprfx z0\.d, p0/z, z1\.d
** fmul z0\.d, p0/m, z0\.d, z2\.d
** |
** movprfx z0\.d, p0/z, z2\.d
** fmul z0\.d, p0/m, z0\.d, z1\.d
** )
** ret
*/
TEST_UNIFORM_Z (mul_f64_z_untied, svfloat64_t,
z0 = svmul_f64_z (p0, z1, z2),
z0 = svmul_z (p0, z1, z2))
/*
** mul_d4_f64_z_tied1:
** mov (z[0-9]+\.d), d4
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_z_tied1, svfloat64_t, double,
z0 = svmul_n_f64_z (p0, z0, d4),
z0 = svmul_z (p0, z0, d4))
/*
** mul_d4_f64_z_untied:
** mov (z[0-9]+\.d), d4
** (
** movprfx z0\.d, p0/z, z1\.d
** fmul z0\.d, p0/m, z0\.d, \1
** |
** movprfx z0\.d, p0/z, \1
** fmul z0\.d, p0/m, z0\.d, z1\.d
** )
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_z_untied, svfloat64_t, double,
z0 = svmul_n_f64_z (p0, z1, d4),
z0 = svmul_z (p0, z1, d4))
/*
** mul_1_f64_z_tied1:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, \1
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_z_tied1, svfloat64_t,
z0 = svmul_n_f64_z (p0, z0, 1),
z0 = svmul_z (p0, z0, 1))
/*
** mul_1_f64_z_untied:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** (
** movprfx z0\.d, p0/z, z1\.d
** fmul z0\.d, p0/m, z0\.d, \1
** |
** movprfx z0\.d, p0/z, \1
** fmul z0\.d, p0/m, z0\.d, z1\.d
** )
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_z_untied, svfloat64_t,
z0 = svmul_n_f64_z (p0, z1, 1),
z0 = svmul_z (p0, z1, 1))
/*
** mul_0p5_f64_z_tied1:
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_z_tied1, svfloat64_t,
z0 = svmul_n_f64_z (p0, z0, 0.5),
z0 = svmul_z (p0, z0, 0.5))
/*
** mul_0p5_f64_z_untied:
** movprfx z0\.d, p0/z, z1\.d
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_z_untied, svfloat64_t,
z0 = svmul_n_f64_z (p0, z1, 0.5),
z0 = svmul_z (p0, z1, 0.5))
/*
** mul_2_f64_z_tied1:
** movprfx z0\.d, p0/z, z0\.d
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_z_tied1, svfloat64_t,
z0 = svmul_n_f64_z (p0, z0, 2),
z0 = svmul_z (p0, z0, 2))
/*
** mul_2_f64_z_untied:
** movprfx z0\.d, p0/z, z1\.d
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_z_untied, svfloat64_t,
z0 = svmul_n_f64_z (p0, z1, 2),
z0 = svmul_z (p0, z1, 2))
/*
** mul_f64_x_tied1:
** fmul z0\.d, (z0\.d, z1\.d|z1\.d, z0\.d)
** ret
*/
TEST_UNIFORM_Z (mul_f64_x_tied1, svfloat64_t,
z0 = svmul_f64_x (p0, z0, z1),
z0 = svmul_x (p0, z0, z1))
/*
** mul_f64_x_tied2:
** fmul z0\.d, (z0\.d, z1\.d|z1\.d, z0\.d)
** ret
*/
TEST_UNIFORM_Z (mul_f64_x_tied2, svfloat64_t,
z0 = svmul_f64_x (p0, z1, z0),
z0 = svmul_x (p0, z1, z0))
/*
** mul_f64_x_untied:
** fmul z0\.d, (z1\.d, z2\.d|z2\.d, z1\.d)
** ret
*/
TEST_UNIFORM_Z (mul_f64_x_untied, svfloat64_t,
z0 = svmul_f64_x (p0, z1, z2),
z0 = svmul_x (p0, z1, z2))
/*
** mul_d4_f64_x_tied1:
** mov (z[0-9]+\.d), d4
** fmul z0\.d, (z0\.d, \1|\1, z0\.d)
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_x_tied1, svfloat64_t, double,
z0 = svmul_n_f64_x (p0, z0, d4),
z0 = svmul_x (p0, z0, d4))
/*
** mul_d4_f64_x_untied:
** mov (z[0-9]+\.d), d4
** fmul z0\.d, (z1\.d, \1|\1, z1\.d)
** ret
*/
TEST_UNIFORM_ZD (mul_d4_f64_x_untied, svfloat64_t, double,
z0 = svmul_n_f64_x (p0, z1, d4),
z0 = svmul_x (p0, z1, d4))
/*
** mul_1_f64_x_tied1:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** fmul z0\.d, (z0\.d, \1|\1, z0\.d)
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (p0, z0, 1),
z0 = svmul_x (p0, z0, 1))
/*
** mul_1_f64_x_untied:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** fmul z0\.d, (z1\.d, \1|\1, z1\.d)
** ret
*/
TEST_UNIFORM_Z (mul_1_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (p0, z1, 1),
z0 = svmul_x (p0, z1, 1))
/*
** mul_0p5_f64_x_tied1:
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (p0, z0, 0.5),
z0 = svmul_x (p0, z0, 0.5))
/*
** mul_0p5_f64_x_untied:
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, #0\.5
** ret
*/
TEST_UNIFORM_Z (mul_0p5_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (p0, z1, 0.5),
z0 = svmul_x (p0, z1, 0.5))
/*
** mul_2_f64_x_tied1:
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (p0, z0, 2),
z0 = svmul_x (p0, z0, 2))
/*
** mul_2_f64_x_untied:
** movprfx z0, z1
** fmul z0\.d, p0/m, z0\.d, #2\.0
** ret
*/
TEST_UNIFORM_Z (mul_2_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (p0, z1, 2),
z0 = svmul_x (p0, z1, 2))
/*
** ptrue_mul_f64_x_tied1:
** fmul z0\.d, (z0\.d, z1\.d|z1\.d, z0\.d)
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_f64_x_tied1, svfloat64_t,
z0 = svmul_f64_x (svptrue_b64 (), z0, z1),
z0 = svmul_x (svptrue_b64 (), z0, z1))
/*
** ptrue_mul_f64_x_tied2:
** fmul z0\.d, (z0\.d, z1\.d|z1\.d, z0\.d)
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_f64_x_tied2, svfloat64_t,
z0 = svmul_f64_x (svptrue_b64 (), z1, z0),
z0 = svmul_x (svptrue_b64 (), z1, z0))
/*
** ptrue_mul_f64_x_untied:
** fmul z0\.d, (z1\.d, z2\.d|z2\.d, z1\.d)
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_f64_x_untied, svfloat64_t,
z0 = svmul_f64_x (svptrue_b64 (), z1, z2),
z0 = svmul_x (svptrue_b64 (), z1, z2))
/*
** ptrue_mul_1_f64_x_tied1:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** fmul z0\.d, (z0\.d, \1|\1, z0\.d)
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_1_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z0, 1),
z0 = svmul_x (svptrue_b64 (), z0, 1))
/*
** ptrue_mul_1_f64_x_untied:
** fmov (z[0-9]+\.d), #1\.0(?:e\+0)?
** fmul z0\.d, (z1\.d, \1|\1, z1\.d)
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_1_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z1, 1),
z0 = svmul_x (svptrue_b64 (), z1, 1))
/*
** ptrue_mul_0p5_f64_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_0p5_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z0, 0.5),
z0 = svmul_x (svptrue_b64 (), z0, 0.5))
/*
** ptrue_mul_0p5_f64_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_0p5_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z1, 0.5),
z0 = svmul_x (svptrue_b64 (), z1, 0.5))
/*
** ptrue_mul_2_f64_x_tied1:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_2_f64_x_tied1, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z0, 2),
z0 = svmul_x (svptrue_b64 (), z0, 2))
/*
** ptrue_mul_2_f64_x_untied:
** ...
** ptrue p[0-9]+\.b[^\n]*
** ...
** ret
*/
TEST_UNIFORM_Z (ptrue_mul_2_f64_x_untied, svfloat64_t,
z0 = svmul_n_f64_x (svptrue_b64 (), z1, 2),
z0 = svmul_x (svptrue_b64 (), z1, 2))