/* vect-reduc-dot-s16b.c */
/* { dg-require-effective-target vect_int } */
#include <stdarg.h>
#include "tree-vect.h"
/* Number of elements in each input vector.  */
#define N 64

/* Expected dot product for the inputs written by main (X[i] = i,
   Y[i] = 64 - i): the sum of i * (64 - i) for i in [0, 64) is 43680.  */
#define DOT 43680

/* Input vectors, aligned to the largest alignment the target supports.  */
signed short X[N]
  __attribute__ ((__aligned__(__BIGGEST_ALIGNMENT__)));
signed short Y[N]
  __attribute__ ((__aligned__(__BIGGEST_ALIGNMENT__)));
/* short->short->int dot product: every X[k] * Y[k] product is first
   stored into a short and only then added to the int accumulator.
   Should be vectorized on architectures supporting vectorized
   multiplication of two short args with short result, e.g. "mulv4hi3",
   and widening sum.

   LEN is the number of leading elements of X and Y to process.
   Returns the accumulated sum.  */
__attribute__ ((noinline)) int
foo (int len)
{
  int sum = 0;
  int k;
  short term;

  for (k = 0; k < len; k++)
    {
      /* The assignment to a short is deliberate: it is what makes the
	 multiplication a short-result one.  */
      term = X[k] * Y[k];
      sum += term;
    }

  return sum;
}
/* Test driver: fill X and Y, run foo over all N elements and abort
   unless the result equals DOT.  Returns 0 on success.  */
int
main (void)
{
  int idx;
  int got;

  check_vect ();

  for (idx = 0; idx < N; idx++)
    {
      X[idx] = idx;
      Y[idx] = 64 - idx;
      /* Empty volatile asm in the loop body; presumably here to keep
	 this initialization loop from being vectorized, so that only
	 the loop in foo is counted.  */
      __asm__ volatile ("");
    }

  got = foo (N);
  if (got != DOT)
    abort ();

  return 0;
}
/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" { target { vect_short_mult && { vect_widen_sum_hi_to_si || vect_unpack } } } } } */
/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 0 "vect" { target { ! vect_short_mult } } } } */
/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 0 "vect" { target { { ! vect_widen_sum_hi_to_si } && { ! vect_unpack } } } } } */