blob: 8151387600f108d5da9c8a244aea916d7474a2b0 [file] [log] [blame]
/* { dg-do run } */
/* { dg-options "-O2 -fdump-rtl-combine --save-temps" } */
/* Test that we don't generate BSL when in DImode with values in integer
registers, and do generate it where we have values in floating-point
registers. This is useful, as it allows us to avoid register moves
in the general case.
We want:
eor x0, x0, x1
and x0, x0, x2
eor x0, x0, x1
ret
Rather than:
fmov d2, x0
fmov d0, x2
fmov d1, x1
bsl v0.8b, v2.8b, v1.8b
fmov x0, d0
ret */
extern void abort (void);
unsigned long long __attribute__ ((noinline))
foo (unsigned long long a, unsigned long long b, unsigned long long c)
{
return ((a ^ b) & c) ^ b;
}
unsigned long long __attribute__ ((noinline))
foo2 (unsigned long long a, unsigned long long b, unsigned long long c)
{
return ((a ^ b) & c) ^ a;
}
#define force_simd(V1) asm volatile ("mov %d0, %1.d[0]" \
: "=w"(V1) \
: "w"(V1) \
: /* No clobbers */);
unsigned long long __attribute__ ((noinline))
bar (unsigned long long a, unsigned long long b, unsigned long long c)
{
force_simd (a);
force_simd (b);
force_simd (c);
c = ((a ^ b) & c) ^ b;
force_simd (c);
return c;
}
unsigned long long __attribute__ ((noinline))
bar2 (unsigned long long a, unsigned long long b, unsigned long long c)
{
force_simd (a);
force_simd (b);
force_simd (c);
c = ((a ^ b) & c) ^ a;
force_simd (c);
return c;
}
int
main (int argc, char** argv)
{
unsigned long long a = 0x0123456789abcdefULL;
unsigned long long b = 0xfedcba9876543210ULL;
unsigned long long c = 0xaabbccddeeff7777ULL;
if (foo (a, b, c) != bar (a, b, c))
abort ();
if (foo2 (a, b, c) != bar2 (a, b, c))
abort ();
return 0;
}
/* 2 BSL, 6 FMOV (to floating-point registers), and 2 FMOV (to general
purpose registers) for the "bar" tests, which should still use BSL. */
/* { dg-final { scan-assembler-times "bsl\tv\[0-9\]" 2 } } */
/* { dg-final { scan-assembler-times "fmov\td\[0-9\]" 6 } } */
/* { dg-final { scan-assembler-times "fmov\tx\[0-9\]" 2 } } */
/* { dg-final { scan-assembler-not "bif\tv\[0-9\]" } } */
/* { dg-final { scan-assembler-not "bit\tv\[0-9\]" } } */
/* We always match the idiom during combine. */
/* { dg-final { scan-rtl-dump-times "aarch64_simd_bsldi_internal" 2 "combine" } } */
/* { dg-final { scan-rtl-dump-times "aarch64_simd_bsldi_alt" 2 "combine" } } */