1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
|
/* { dg-do run } */
/* { dg-require-effective-target avx2 } */
/* { dg-options "-O3 -mavx2" } */
#include "avx2-check.h"
/* Number of elements processed by foo and the length of every array
   used in this test.  */
#define N 1024
/* Index tables: filled by avx2_test and read by foo to form the
   subscripts of its two indexed loads (a/b for the first operand,
   c/d for the second).  */
int a[N], b[N], c[N], d[N];
/* Kernel under test.  For every i in [0, N) store into p[i] the product
   of two indirectly addressed floats:

     p[i] = q[a[i] * s1 + b[i] * s2 + s3] * r[c[i] * s1 + d[i] * s2 + s3]

   The subscripts mix the int index tables a/b/c/d with the long strides
   s1/s2 and the long offset s3, so they are evaluated in type long.
   p, q and r are restrict-qualified, i.e. the caller promises they do
   not alias.  The function is marked noinline and noclone so it is
   compiled as a standalone function rather than being inlined or cloned
   into its caller.
   NOTE(review): presumably meant to exercise AVX2 gather-load
   vectorization at -O3 -mavx2 -- confirm against the testsuite intent
   before changing the shape of the loop.  */
__attribute__((noinline, noclone)) void
foo (float *__restrict p, float *__restrict q, float *__restrict r,
long s1, long s2, long s3)
{
int i;
for (i = 0; i < N; i++)
p[i] = q[a[i] * s1 + b[i] * s2 + s3] * r[c[i] * s1 + d[i] * s2 + s3];
}
/* Test driver: fill the index tables and the two source arrays with
   known values, run foo with strides 3 and 2 and offset 4, then compare
   every output element against a value computed directly from the index
   tables.  Calls abort () on the first mismatch.
   NOTE(review): not called from this file; presumably invoked by the
   harness in avx2-check.h -- confirm.  */
static void
avx2_test (void)
{
  float src_q[N], src_r[N], out[N];
  int k;

  /* Every table entry is masked into [0, N / 8 - 1], which keeps the
     largest subscript foo forms (3 * max + 2 * max + 4) below N.  */
  for (k = 0; k < N; k++)
    {
      const int mask = N / 8 - 1;

      a[k] = (k * 7) & mask;
      b[k] = (k * 13) & mask;
      c[k] = (k * 23) & mask;
      d[k] = (k * 5) & mask;
      src_q[k] = 16.5 + k;
      src_r[k] = 127.5 - k;
    }

  foo (out, src_q, src_r, 3, 2, 4);

  /* src_q[j] is 16.5 + j and src_r[j] is 127.5 - j, so with offset 4
     folded in, the two loaded operands are 20.5 + 3a + 2b and
     123.5 - 3c - 2d respectively.  */
  for (k = 0; k < N; k++)
    {
      float expected = (float) ((20.5 + a[k] * 3 + b[k] * 2)
                                * (123.5 - c[k] * 3 - d[k] * 2));

      if (out[k] != expected)
        abort ();
    }
}
|