| void add90 (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N]) /* Treating each (even, odd) element pair as (real, imag), stores c = a + b*i, i.e. b rotated by 90 degrees and added to a.  */ |
| { /* TYPE and N are not defined in this chunk; the loop reads index i+1, so N is presumably even -- confirm at the definition site.  */ |
| for (int i=0; i < N; i+=2) /* One (even, odd) pair per iteration.  */ |
| { |
| c[i] = a[i] - b[i+1]; /* Even slot: a's even element minus b's odd element.  */ |
| c[i+1] = a[i+1] + b[i]; /* Odd slot: a's odd element plus b's even element.  */ |
| } |
| } |
| |
| /* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 1 "vect" } } */ |
| |
| void add270 (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N]) /* Treating each (even, odd) element pair as (real, imag), stores c = a - b*i, i.e. b rotated by 270 degrees and added to a.  */ |
| { /* TYPE and N are not defined in this chunk; the loop reads index i+1, so N is presumably even -- confirm at the definition site.  */ |
| for (int i=0; i < N; i+=2) /* One (even, odd) pair per iteration.  */ |
| { |
| c[i] = a[i] + b[i+1]; /* Even slot: a's even element plus b's odd element.  */ |
| c[i+1] = a[i+1] - b[i]; /* Odd slot: a's odd element minus b's even element.  */ |
| } |
| } |
| |
| /* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT270" 1 "vect" } } */ |
| |
| void addMixed (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N]) /* Handles two (even, odd) pairs per iteration with different sign patterns: the first pair uses the add90 form, the second the add270 form.  */ |
| { /* TYPE and N are not defined in this chunk; the loop reads up to index i+3, so N is presumably a multiple of 4 -- confirm at the definition site.  */ |
| for (int i=0; i < N; i+=4) /* Four elements (two pairs) per iteration.  */ |
| { |
| c[i] = a[i] - b[i+1]; /* First pair, even slot: minus b's odd element.  */ |
| c[i+1] = a[i+1] + b[i]; /* First pair, odd slot: plus b's even element.  */ |
| c[i+2] = a[i+2] + b[i+3]; /* Second pair, even slot: plus b's odd element.  */ |
| c[i+3] = a[i+3] - b[i+2]; /* Second pair, odd slot: minus b's even element.  */ |
| } |
| } |
| |
| void add90HandUnrolled (TYPE a[restrict N], TYPE b[restrict N], |
| TYPE c[restrict N]) /* Same per-pair arithmetic as the add90 form (subtract b's odd element, add b's even element), but with two pairs per iteration and both even-slot stores issued before both odd-slot stores.  */ |
| { /* TYPE and N are not defined in this chunk.  */ |
| for (int i=0; i < (N /2); i+=4) /* NOTE(review): the bound is N/2, not N as in the sibling kernels, so only roughly the first half of the arrays is written -- confirm this is intended.  */ |
| { |
| c[i] = a[i] - b[i+1]; /* First pair, even slot.  */ |
| c[i+2] = a[i+2] - b[i+3]; /* Second pair, even slot.  */ |
| c[i+1] = a[i+1] + b[i]; /* First pair, odd slot.  */ |
| c[i+3] = a[i+3] + b[i+2]; /* Second pair, odd slot.  */ |
| } |
| } |
| |
| /* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 1 "vect" } } */ |
| |
| void add90Hybrid (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N], |
| TYPE d[restrict N]) /* Writes two outputs from the same loads: c gets the add90 form (a + b*i when pairs are read as (real, imag)), d gets the plain element-wise difference a - b.  */ |
| { /* TYPE and N are not defined in this chunk; the loop reads index i+1, so N is presumably even -- confirm at the definition site.  */ |
| for (int i=0; i < N; i+=2) /* One (even, odd) pair per iteration.  */ |
| { |
| c[i] = a[i] - b[i+1]; /* c even slot: a's even element minus b's odd element.  */ |
| c[i+1] = a[i+1] + b[i]; /* c odd slot: a's odd element plus b's even element.  */ |
| d[i] = a[i] - b[i]; /* d even slot: same-index subtraction.  */ |
| d[i+1] = a[i+1] - b[i+1]; /* d odd slot: same-index subtraction.  */ |
| } |
| } |
| |
| /* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 2 "vect" } } */ |