blob: 39fdea3a69dd7b56737a9dae00dcf93d09001147 [file] [log] [blame]
/* { dg-do run } */
/* { dg-options "-O2 -mavx2 -ftree-vectorize -fvect-cost-model=unlimited -mprefer-vector-width=256" } */
/* { dg-require-effective-target avx2 } */
#include "avx2-check.h"
#include <string.h>
#include "pr103144-mul-1.c"
typedef int v8si __attribute__((vector_size(32)));
void
avx2_test (void)
{
int* epi32_exp = (int*) malloc (N * sizeof (int));
int* epi32_dst = (int*) malloc (N * sizeof (int));
__builtin_memset (epi32_exp, 0, N * sizeof (int));
int b = 8;
v8si init = __extension__(v8si) { b, b * 3, b * 9, b * 27, b * 81, b * 243, b * 729, b * 2187 };
for (int i = 0; i != N / 8; i++)
{
memcpy (epi32_exp + i * 8, &init, 32);
init *= 6561;
}
foo_mul (epi32_dst, b);
if (__builtin_memcmp (epi32_dst, epi32_exp, N * sizeof (int)) != 0)
__builtin_abort ();
foo_mul_peel (epi32_dst, b);
if (__builtin_memcmp (epi32_dst, epi32_exp, 39 * 4) != 0)
__builtin_abort ();
init = __extension__(v8si) { 1, 3, 9, 27, 81, 243, 729, 2187 };
for (int i = 0; i != N / 8; i++)
{
memcpy (epi32_exp + i * 8, &init, 32);
init *= 6561;
}
foo_mul_const (epi32_dst);
if (__builtin_memcmp (epi32_dst, epi32_exp, N * sizeof (int)) != 0)
__builtin_abort ();
foo_mul_peel_const (epi32_dst);
if (__builtin_memcmp (epi32_dst, epi32_exp, 39 * 4) != 0)
__builtin_abort ();
return;
}