/* { dg-do run } */ /* { dg-require-effective-target avx2 } */ /* { dg-options "-O2 -mavx2" } */ #include #include "avx2-check.h" static void compute_i32gatherps256 (float *src, float *s1, int *s2, float *mask, int scale, float *r) { int i; for (i = 0; i < 8; ++i) if ((((int *) mask)[i] >> 31) & 1) r[i] = *(float *) (((unsigned char *) s1) + s2[i] * scale); else r[i] = src[i]; } void static avx2_test (void) { int i; union256i_d idx; union256 res, src, mask; float s1[8], res_ref[8] = { 0 }; for (i = 0; i < 8; ++i) { /* Set some stuff */ s1[i] = 2.718281828459045 * (i + 1) * (i + 2); /* Set src as something different from s1 */ src.a[i] = -s1[i]; /* Mask out evens */ ((int *) mask.a)[i] = i % 2 ? 0 : -1; /* About to gather in reverse order, divide by 2 to demonstrate scale */ idx.a[i] = (32 - (i + 1) * 4) >> 1; } res.x = _mm256_mask_i32gather_ps (src.x, s1, idx.x, mask.x, 2); compute_i32gatherps256 (src.a, s1, idx.a, mask.a, 2, res_ref); if (check_union256 (res, res_ref) != 0) abort (); }