| /* { dg-do run } */ |
| /* { dg-require-effective-target avx2 } */ |
| /* { dg-options "-O2 -mavx2" } */ |
| |
| #include <string.h> |
| #include "avx2-check.h" |
| |
| static void |
| compute_i64gatherps (float *src, |
| float *s1, |
| long long *s2, float *mask, int scale, float *r) |
| { |
| int i; |
| |
| for (i = 0; i < 2; ++i) |
| if ((((int *) mask)[i] >> 31) & 1) |
| r[i] = *(float *) (((unsigned char *) s1) + s2[i] * scale); |
| else |
| r[i] = src[i]; |
| } |
| |
| void static |
| avx2_test (void) |
| { |
| int i; |
| union128i_q idx; |
| union128 res, src, mask; |
| float s1[2], res_ref[4] = { 0 }; |
| |
| for (i = 0; i < 2; ++i) |
| { |
| /* Set some stuff */ |
| s1[i] = 2.718281828459045 * (i + 1) * (i + 2); |
| |
| /* Set src as something different from s1 */ |
| src.a[i] = -s1[i]; |
| |
| /* Mask out evens */ |
| ((int *) mask.a)[i] = i % 2 ? 0 : -1; |
| |
| /* About to gather in reverse order, |
| divide by 2 to demonstrate scale */ |
| idx.a[i] = (8 - (i + 1) * 4) >> 1; |
| } |
| |
| res.x = _mm_mask_i64gather_ps (src.x, s1, idx.x, mask.x, 2); |
| |
| compute_i64gatherps (src.a, s1, idx.a, mask.a, 2, res_ref); |
| |
| if (check_union128 (res, res_ref) != 0) |
| abort (); |
| } |