/* complex-add-pattern-template.c  */
/* For every even index i in [0, N), store a[i] - b[i+1] into c[i] and
   a[i+1] + b[i] into c[i+1].  Reading each (even, odd) element pair as
   the (real, imaginary) parts of a complex number, this is c = a + b * i.

   TYPE and N are not defined in the visible part of this file; they must
   already be defined wherever this function is compiled.  When UNROLL is
   defined, the loop is annotated with "#pragma GCC unroll 16".  The
   preprocessor directives have to stay on lines of their own.  */
void add90 (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N])
{
#if defined (UNROLL)
#pragma GCC unroll 16
#endif
  for (int i=0; i < N; i+=2)
    {
      c[i] = a[i] - b[i+1];
      c[i+1] = a[i+1] + b[i];
    }
}
/* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 1 "vect" } } */
/* For every even index i in [0, N), store a[i] + b[i+1] into c[i] and
   a[i+1] - b[i] into c[i+1].  Reading each (even, odd) element pair as
   the (real, imaginary) parts of a complex number, this is c = a - b * i.

   TYPE and N are not defined in the visible part of this file; they must
   already be defined wherever this function is compiled.  When UNROLL is
   defined, the loop is annotated with "#pragma GCC unroll 16".  The
   preprocessor directives have to stay on lines of their own.  */
void add270 (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N])
{
#if defined (UNROLL)
#pragma GCC unroll 16
#endif
  for (int i=0; i < N; i+=2)
    {
      c[i] = a[i] + b[i+1];
      c[i+1] = a[i+1] - b[i];
    }
}
/* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT270" 1 "vect" } } */
/* Process four elements per iteration for i = 0, 4, 8, ... while i < N.
   The first pair (i, i+1) uses the subtract/add form:
     c[i] = a[i] - b[i+1],  c[i+1] = a[i+1] + b[i]
   and the second pair (i+2, i+3) uses the add/subtract form:
     c[i+2] = a[i+2] + b[i+3],  c[i+3] = a[i+3] - b[i+2].

   TYPE and N are not defined in the visible part of this file; they must
   already be defined wherever this function is compiled.  When UNROLL is
   defined, the loop is annotated with "#pragma GCC unroll 16".  The
   preprocessor directives have to stay on lines of their own.  */
void addMixed (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N])
{
#if defined (UNROLL)
#pragma GCC unroll 16
#endif
  for (int i=0; i < N; i+=4)
    {
      c[i] = a[i] - b[i+1];
      c[i+1] = a[i+1] + b[i];
      c[i+2] = a[i+2] + b[i+3];
      c[i+3] = a[i+3] - b[i+2];
    }
}
/* Manually unrolled variant of the subtract/add pattern: each iteration
   handles the two pairs (i, i+1) and (i+2, i+3), writing both
   even-indexed results first and both odd-indexed results second:
     c[i]   = a[i]   - b[i+1],  c[i+2] = a[i+2] - b[i+3]
     c[i+1] = a[i+1] + b[i],    c[i+3] = a[i+3] + b[i+2].
   The loop advances i by 4 and runs while i < N / 2.

   TYPE and N are not defined in the visible part of this file; they must
   already be defined wherever this function is compiled.  When UNROLL is
   defined, the loop is annotated with "#pragma GCC unroll 16".  The
   preprocessor directives have to stay on lines of their own.  */
void add90HandUnrolled (TYPE a[restrict N], TYPE b[restrict N],
			TYPE c[restrict N])
{
#if defined (UNROLL)
#pragma GCC unroll 16
#endif
  for (int i=0; i < (N /2); i+=4)
    {
      c[i] = a[i] - b[i+1];
      c[i+2] = a[i+2] - b[i+3];
      c[i+1] = a[i+1] + b[i];
      c[i+3] = a[i+3] + b[i+2];
    }
}
/* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 1 "vect" } } */
/* For every even index i in [0, N), produce two outputs from the same
   inputs:
     c[i] = a[i] - b[i+1],  c[i+1] = a[i+1] + b[i]   (subtract/add form)
     d[i] = a[i] - b[i],    d[i+1] = a[i+1] - b[i+1] (element-wise a - b).

   TYPE and N are not defined in the visible part of this file; they must
   already be defined wherever this function is compiled.  When UNROLL is
   defined, the loop is annotated with "#pragma GCC unroll 16".  The
   preprocessor directives have to stay on lines of their own.  */
void add90Hybrid (TYPE a[restrict N], TYPE b[restrict N], TYPE c[restrict N],
		  TYPE d[restrict N])
{
#if defined (UNROLL)
#pragma GCC unroll 16
#endif
  for (int i=0; i < N; i+=2)
    {
      c[i] = a[i] - b[i+1];
      c[i+1] = a[i+1] + b[i];
      d[i] = a[i] - b[i];
      d[i+1] = a[i+1] - b[i+1];
    }
}
/* { dg-final { scan-tree-dump-times "stmt.*COMPLEX_ADD_ROT90" 2 "vect" } } */
|