blob: a6f2dc48b3d83bab1c310e2d29a656a92bf0a9b3 [file] [log] [blame]
#include <stdlib.h>
#include <stddef.h>
#include <altivec.h>
#ifndef RTYPE
#define RTYPE TYPE
#endif
#ifdef DO_TRACE
#include <stdio.h>
#define TRACE(STRING, NUM) \
do \
{ \
fprintf (stderr, "%s%s: %2d\n", (NUM == 0) ? "\n" : "", \
STRING, (int)NUM); \
fflush (stderr); \
} \
while (0)
#ifndef FAIL_FORMAT
#define FAIL_FORMAT "%ld"
#define FAIL_CAST(X) ((long)(X))
#endif
#define FAIL(EXP, GOT) \
do \
{ \
fprintf (stderr, "Expected: " FAIL_FORMAT ", got " FAIL_FORMAT "\n", \
FAIL_CAST (EXP), FAIL_CAST (GOT)); \
fflush (stderr); \
abort (); \
} \
while (0)
#else
#define TRACE(STRING, NUM)
#define FAIL(EXP, GOT) abort ()
#endif
static void check (RTYPE, RTYPE) __attribute__((__noinline__));
static vector TYPE deoptimize (vector TYPE) __attribute__((__noinline__));
static vector TYPE *deoptimize_ptr (vector TYPE *) __attribute__((__noinline__));
static void
check (RTYPE expected, RTYPE got)
{
if (expected != got)
FAIL (expected, got);
}
static vector TYPE
deoptimize (vector TYPE a)
{
__asm__ (" # %x0" : "+wa" (a));
return a;
}
static vector TYPE *
deoptimize_ptr (vector TYPE *p)
{
__asm__ (" # %0" : "+r" (p));
return p;
}
/* Tests for the normal case of vec_extract where the vector is in a register
and returning the result in a register as a return value. */
RTYPE
get_auto_n (vector TYPE a, ssize_t n)
{
return (RTYPE) vec_extract (a, n);
}
RTYPE
get_auto_0 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 0);
}
RTYPE
get_auto_1 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 1);
}
#if ELEMENTS >= 4
RTYPE
get_auto_2 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 2);
}
RTYPE
get_auto_3 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 3);
}
#if ELEMENTS >= 8
RTYPE
get_auto_4 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 4);
}
RTYPE
get_auto_5 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 5);
}
RTYPE
get_auto_6 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 6);
}
RTYPE
get_auto_7 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 7);
}
#if ELEMENTS >= 16
RTYPE
get_auto_8 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 8);
}
RTYPE
get_auto_9 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 9);
}
RTYPE
get_auto_10 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 10);
}
RTYPE
get_auto_11 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 11);
}
RTYPE
get_auto_12 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 12);
}
RTYPE
get_auto_13 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 13);
}
RTYPE
get_auto_14 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 14);
}
RTYPE
get_auto_15 (vector TYPE a)
{
return (RTYPE) vec_extract (a, 15);
}
#endif
#endif
#endif
typedef RTYPE (*auto_func_type) (vector TYPE);
static auto_func_type get_auto_const[] = {
get_auto_0,
get_auto_1,
#if ELEMENTS >= 4
get_auto_2,
get_auto_3,
#if ELEMENTS >= 8
get_auto_4,
get_auto_5,
get_auto_6,
get_auto_7,
#if ELEMENTS >= 16
get_auto_8,
get_auto_9,
get_auto_10,
get_auto_11,
get_auto_12,
get_auto_13,
get_auto_14,
get_auto_15,
#endif
#endif
#endif
};
extern void do_auto (vector TYPE a) __attribute__((__noinline__));
void
do_auto (vector TYPE a)
{
size_t i;
for (i = 0; i < sizeof (get_auto_const) / sizeof (get_auto_const[0]); i++)
{
TRACE ("auto", i);
check (get_auto_n (a, i), (get_auto_const[i]) (a));
}
}
/* Tests for vec_extract of a vector in a register, but storing the result
(there is an optimization where an element can be stored to memory if it is
in the right position to use a scalar store). */
void
get_store_n (RTYPE *p, vector TYPE a, ssize_t n)
{
*p = (RTYPE) vec_extract (a, n);
}
void
get_store_0 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 0);
}
void
get_store_1 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 1);
}
#if ELEMENTS >= 4
void
get_store_2 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 2);
}
void
get_store_3 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 3);
}
#if ELEMENTS >= 8
void
get_store_4 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 4);
}
void
get_store_5 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 5);
}
void
get_store_6 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 6);
}
void
get_store_7 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 7);
}
#if ELEMENTS >= 16
void
get_store_8 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 8);
}
void
get_store_9 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 9);
}
void
get_store_10 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 10);
}
void
get_store_11 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 11);
}
void
get_store_12 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 12);
}
void
get_store_13 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 13);
}
void
get_store_14 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 14);
}
void
get_store_15 (RTYPE *p, vector TYPE a)
{
*p = (RTYPE) vec_extract (a, 15);
}
#endif
#endif
#endif
typedef void (*store_func_type) (RTYPE *, vector TYPE);
static store_func_type get_store_const[] = {
get_store_0,
get_store_1,
#if ELEMENTS >= 4
get_store_2,
get_store_3,
#if ELEMENTS >= 8
get_store_4,
get_store_5,
get_store_6,
get_store_7,
#if ELEMENTS >= 16
get_store_8,
get_store_9,
get_store_10,
get_store_11,
get_store_12,
get_store_13,
get_store_14,
get_store_15,
#endif
#endif
#endif
};
extern void do_store (vector TYPE a) __attribute__((__noinline__));
void
do_store (vector TYPE a)
{
size_t i;
RTYPE result_var, result_const;
for (i = 0; i < sizeof (get_store_const) / sizeof (get_store_const[0]); i++)
{
TRACE ("store", i);
get_store_n (&result_var, a, i);
(get_store_const[i]) (&result_const, a);
check (result_var, result_const);
}
}
/* Tests for vec_extract where the vector comes from memory (the compiler can
optimize this by doing a scalar load without having to load the whole
vector). */
RTYPE
get_pointer_n (vector TYPE *p, ssize_t n)
{
return (RTYPE) vec_extract (*p, n);
}
RTYPE
get_pointer_0 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 0);
}
RTYPE
get_pointer_1 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 1);
}
#if ELEMENTS >= 4
RTYPE
get_pointer_2 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 2);
}
RTYPE
get_pointer_3 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 3);
}
#if ELEMENTS >= 8
RTYPE
get_pointer_4 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 4);
}
RTYPE
get_pointer_5 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 5);
}
RTYPE
get_pointer_6 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 6);
}
RTYPE
get_pointer_7 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 7);
}
#if ELEMENTS >= 16
RTYPE
get_pointer_8 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 8);
}
RTYPE
get_pointer_9 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 9);
}
RTYPE
get_pointer_10 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 10);
}
RTYPE
get_pointer_11 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 11);
}
RTYPE
get_pointer_12 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 12);
}
RTYPE
get_pointer_13 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 13);
}
RTYPE
get_pointer_14 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 14);
}
RTYPE
get_pointer_15 (vector TYPE *p)
{
return (RTYPE) vec_extract (*p, 15);
}
#endif
#endif
#endif
typedef RTYPE (*pointer_func_type) (vector TYPE *);
static pointer_func_type get_pointer_const[] = {
get_pointer_0,
get_pointer_1,
#if ELEMENTS >= 4
get_pointer_2,
get_pointer_3,
#if ELEMENTS >= 8
get_pointer_4,
get_pointer_5,
get_pointer_6,
get_pointer_7,
#if ELEMENTS >= 16
get_pointer_8,
get_pointer_9,
get_pointer_10,
get_pointer_11,
get_pointer_12,
get_pointer_13,
get_pointer_14,
get_pointer_15,
#endif
#endif
#endif
};
extern void do_pointer (vector TYPE *p) __attribute__((__noinline__));
void
do_pointer (vector TYPE *p)
{
size_t i;
for (i = 0; i < sizeof (get_pointer_const) / sizeof (get_pointer_const[0]); i++)
{
TRACE ("pointer", i);
check (get_pointer_n (p, i), (get_pointer_const[i]) (p));
}
}
/* Test for vec_extract where the vector comes from an indexed memory
operation. This is to make sure that if the compiler optimizes vec_extract
from memory to be a scalar load, the address is correctly adjusted. */
RTYPE
get_indexed_n (vector TYPE *p, size_t x, ssize_t n)
{
return (RTYPE) vec_extract (p[x], n);
}
RTYPE
get_indexed_0 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 0);
}
RTYPE
get_indexed_1 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 1);
}
#if ELEMENTS >= 4
RTYPE
get_indexed_2 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 2);
}
RTYPE
get_indexed_3 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 3);
}
#if ELEMENTS >= 8
RTYPE
get_indexed_4 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 4);
}
RTYPE
get_indexed_5 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 5);
}
RTYPE
get_indexed_6 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 6);
}
RTYPE
get_indexed_7 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 7);
}
#if ELEMENTS >= 16
RTYPE
get_indexed_8 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 8);
}
RTYPE
get_indexed_9 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 9);
}
RTYPE
get_indexed_10 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 10);
}
RTYPE
get_indexed_11 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 11);
}
RTYPE
get_indexed_12 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 12);
}
RTYPE
get_indexed_13 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 13);
}
RTYPE
get_indexed_14 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 14);
}
RTYPE
get_indexed_15 (vector TYPE *p, size_t x)
{
return (RTYPE) vec_extract (p[x], 15);
}
#endif
#endif
#endif
typedef RTYPE (*indexed_func_type) (vector TYPE *, size_t);
static indexed_func_type get_indexed_const[] = {
get_indexed_0,
get_indexed_1,
#if ELEMENTS >= 4
get_indexed_2,
get_indexed_3,
#if ELEMENTS >= 8
get_indexed_4,
get_indexed_5,
get_indexed_6,
get_indexed_7,
#if ELEMENTS >= 16
get_indexed_8,
get_indexed_9,
get_indexed_10,
get_indexed_11,
get_indexed_12,
get_indexed_13,
get_indexed_14,
get_indexed_15,
#endif
#endif
#endif
};
extern void do_indexed (vector TYPE *p, size_t x) __attribute__((__noinline__));
void
do_indexed (vector TYPE *p, size_t x)
{
size_t i;
for (i = 0; i < sizeof (get_indexed_const) / sizeof (get_indexed_const[0]); i++)
{
TRACE ("indexed", i);
check (get_indexed_n (p, x, i), (get_indexed_const[i]) (p, x));
}
}
/* Test for vec_extract where the vector comes from memory using an address
with a pointer and a constant offset. This will occur in ISA 3.0 which
added d-form memory addressing for vectors. */
RTYPE
get_ptr_plus1_n (vector TYPE *p, ssize_t n)
{
return (RTYPE) vec_extract (p[1], n);
}
RTYPE
get_ptr_plus1_0 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 0);
}
RTYPE
get_ptr_plus1_1 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 1);
}
#if ELEMENTS >= 4
RTYPE
get_ptr_plus1_2 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 2);
}
RTYPE
get_ptr_plus1_3 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 3);
}
#if ELEMENTS >= 8
RTYPE
get_ptr_plus1_4 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 4);
}
RTYPE
get_ptr_plus1_5 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 5);
}
RTYPE
get_ptr_plus1_6 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 6);
}
RTYPE
get_ptr_plus1_7 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 7);
}
#if ELEMENTS >= 16
RTYPE
get_ptr_plus1_8 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 8);
}
RTYPE
get_ptr_plus1_9 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 9);
}
RTYPE
get_ptr_plus1_10 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 10);
}
RTYPE
get_ptr_plus1_11 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 11);
}
RTYPE
get_ptr_plus1_12 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 12);
}
RTYPE
get_ptr_plus1_13 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 13);
}
RTYPE
get_ptr_plus1_14 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 14);
}
RTYPE
get_ptr_plus1_15 (vector TYPE *p)
{
return (RTYPE) vec_extract (p[1], 15);
}
#endif
#endif
#endif
typedef RTYPE (*pointer_func_type) (vector TYPE *);
static pointer_func_type get_ptr_plus1_const[] = {
get_ptr_plus1_0,
get_ptr_plus1_1,
#if ELEMENTS >= 4
get_ptr_plus1_2,
get_ptr_plus1_3,
#if ELEMENTS >= 8
get_ptr_plus1_4,
get_ptr_plus1_5,
get_ptr_plus1_6,
get_ptr_plus1_7,
#if ELEMENTS >= 16
get_ptr_plus1_8,
get_ptr_plus1_9,
get_ptr_plus1_10,
get_ptr_plus1_11,
get_ptr_plus1_12,
get_ptr_plus1_13,
get_ptr_plus1_14,
get_ptr_plus1_15,
#endif
#endif
#endif
};
extern void do_ptr_plus1 (vector TYPE *p) __attribute__((__noinline__));
void
do_ptr_plus1 (vector TYPE *p)
{
size_t i;
for (i = 0; i < sizeof (get_ptr_plus1_const) / sizeof (get_ptr_plus1_const[0]); i++)
{
TRACE ("ptr_plus1", i);
check (get_ptr_plus1_n (p, i), (get_ptr_plus1_const[i]) (p));
}
}
/* Test for vec_extract where the vector comes from a static variable. */
static vector TYPE s;
RTYPE
get_static_n (ssize_t n)
{
return (RTYPE) vec_extract (s, n);
}
RTYPE
get_static_0 (void)
{
return (RTYPE) vec_extract (s, 0);
}
RTYPE
get_static_1 (void)
{
return (RTYPE) vec_extract (s, 1);
}
#if ELEMENTS >= 4
RTYPE
get_static_2 (void)
{
return (RTYPE) vec_extract (s, 2);
}
RTYPE
get_static_3 (void)
{
return (RTYPE) vec_extract (s, 3);
}
#if ELEMENTS >= 8
RTYPE
get_static_4 (void)
{
return (RTYPE) vec_extract (s, 4);
}
RTYPE
get_static_5 (void)
{
return (RTYPE) vec_extract (s, 5);
}
RTYPE
get_static_6 (void)
{
return (RTYPE) vec_extract (s, 6);
}
RTYPE
get_static_7 (void)
{
return (RTYPE) vec_extract (s, 7);
}
#if ELEMENTS >= 16
RTYPE
get_static_8 (void)
{
return (RTYPE) vec_extract (s, 8);
}
RTYPE
get_static_9 (void)
{
return (RTYPE) vec_extract (s, 9);
}
RTYPE
get_static_10 (void)
{
return (RTYPE) vec_extract (s, 10);
}
RTYPE
get_static_11 (void)
{
return (RTYPE) vec_extract (s, 11);
}
RTYPE
get_static_12 (void)
{
return (RTYPE) vec_extract (s, 12);
}
RTYPE
get_static_13 (void)
{
return (RTYPE) vec_extract (s, 13);
}
RTYPE
get_static_14 (void)
{
return (RTYPE) vec_extract (s, 14);
}
RTYPE
get_static_15 (void)
{
return (RTYPE) vec_extract (s, 15);
}
#endif
#endif
#endif
typedef RTYPE (*static_func_type) (void);
static static_func_type get_static_const[] = {
get_static_0,
get_static_1,
#if ELEMENTS >= 4
get_static_2,
get_static_3,
#if ELEMENTS >= 8
get_static_4,
get_static_5,
get_static_6,
get_static_7,
#if ELEMENTS >= 16
get_static_8,
get_static_9,
get_static_10,
get_static_11,
get_static_12,
get_static_13,
get_static_14,
get_static_15,
#endif
#endif
#endif
};
extern void do_static (void) __attribute__((__noinline__));
void
do_static (void)
{
size_t i;
for (i = 0; i < sizeof (get_static_const) / sizeof (get_static_const[0]); i++)
{
TRACE ("static", i);
check (get_static_n (i), (get_static_const[i]) ());
}
}
/* Test for vec_extract where the vector is in a global variable. */
vector TYPE g;
RTYPE
get_global_n (ssize_t n)
{
return (RTYPE) vec_extract (g, n);
}
RTYPE
get_global_0 (void)
{
return (RTYPE) vec_extract (g, 0);
}
RTYPE
get_global_1 (void)
{
return (RTYPE) vec_extract (g, 1);
}
#if ELEMENTS >= 4
RTYPE
get_global_2 (void)
{
return (RTYPE) vec_extract (g, 2);
}
RTYPE
get_global_3 (void)
{
return (RTYPE) vec_extract (g, 3);
}
#if ELEMENTS >= 8
RTYPE
get_global_4 (void)
{
return (RTYPE) vec_extract (g, 4);
}
RTYPE
get_global_5 (void)
{
return (RTYPE) vec_extract (g, 5);
}
RTYPE
get_global_6 (void)
{
return (RTYPE) vec_extract (g, 6);
}
RTYPE
get_global_7 (void)
{
return (RTYPE) vec_extract (g, 7);
}
#if ELEMENTS >= 16
RTYPE
get_global_8 (void)
{
return (RTYPE) vec_extract (g, 8);
}
RTYPE
get_global_9 (void)
{
return (RTYPE) vec_extract (g, 9);
}
RTYPE
get_global_10 (void)
{
return (RTYPE) vec_extract (g, 10);
}
RTYPE
get_global_11 (void)
{
return (RTYPE) vec_extract (g, 11);
}
RTYPE
get_global_12 (void)
{
return (RTYPE) vec_extract (g, 12);
}
RTYPE
get_global_13 (void)
{
return (RTYPE) vec_extract (g, 13);
}
RTYPE
get_global_14 (void)
{
return (RTYPE) vec_extract (g, 14);
}
RTYPE
get_global_15 (void)
{
return (RTYPE) vec_extract (g, 15);
}
#endif
#endif
#endif
typedef RTYPE (*global_func_type) (void);
static global_func_type get_global_const[] = {
get_global_0,
get_global_1,
#if ELEMENTS >= 4
get_global_2,
get_global_3,
#if ELEMENTS >= 8
get_global_4,
get_global_5,
get_global_6,
get_global_7,
#if ELEMENTS >= 16
get_global_8,
get_global_9,
get_global_10,
get_global_11,
get_global_12,
get_global_13,
get_global_14,
get_global_15,
#endif
#endif
#endif
};
extern void do_global (void) __attribute__((__noinline__));
void
do_global (void)
{
size_t i;
for (i = 0; i < sizeof (get_global_const) / sizeof (get_global_const[0]); i++)
{
TRACE ("global", i);
check (get_global_n (i), (get_global_const[i]) ());
}
}
/* Main program to test all of the possibilities. */
int
main (void)
{
size_t i;
vector TYPE x = INITIAL;
vector TYPE *p, *p2, a, y;
vector TYPE z[2];
a = deoptimize (x);
s = deoptimize (x);
g = deoptimize (x);
y = deoptimize (x);
z[0] = deoptimize (x);
z[1] = deoptimize (x);
p = deoptimize_ptr (&y);
p2 = deoptimize_ptr (&z[0]);
do_auto (a);
do_store (a);
do_pointer (p);
for (i = 0; i < 2; i++)
do_indexed (p2, i);
do_ptr_plus1 (p2);
do_static ();
do_global ();
return 0;
}