Viewing file: struct_vect_23.c (1.91 KB) -rw-r--r-- Select action/file-type: (+) | (+) | (+) | Code (+) | Session (+) | (+) | SDB (+) | (+) | (+) | (+) | (+) | (+) |
/* { dg-do compile } */ /* { dg-options "-O2 -ftree-vectorize" } */
#include <stdint.h>
#define TEST_LOOP(NAME, TYPE) \ void __attribute__ ((noinline, noclone)) \ NAME (TYPE *restrict dest, TYPE *restrict src, int n) \ { \ for (int i = 0; i < n; ++i) \ dest[i] += src[i * 4]; \ }
#define TEST(NAME) \ TEST_LOOP (NAME##_i8, int8_t) \ TEST_LOOP (NAME##_i16, uint16_t) \ TEST_LOOP (NAME##_f32, float) \ TEST_LOOP (NAME##_f64, double)
TEST (test)
/* Check the vectorized loop. */ /* { dg-final { scan-assembler-times {\tld1b\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld4b\t} 1 } } */ /* { dg-final { scan-assembler-times {\tst1b\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld1h\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld4h\t} 1 } } */ /* { dg-final { scan-assembler-times {\tst1h\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld1w\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld4w\t} 1 } } */ /* { dg-final { scan-assembler-times {\tst1w\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld1d\t} 1 } } */ /* { dg-final { scan-assembler-times {\tld4d\t} 1 } } */ /* { dg-final { scan-assembler-times {\tst1d\t} 1 } } */
/* Check the scalar tail. */ /* { dg-final { scan-assembler-times {\tldrb\tw} 2 } } */ /* { dg-final { scan-assembler-times {\tstrb\tw} 1 } } */ /* { dg-final { scan-assembler-times {\tldrh\tw} 2 } } */ /* { dg-final { scan-assembler-times {\tstrh\tw} 1 } } */ /* { dg-final { scan-assembler-times {\tldr\ts} 2 } } */ /* { dg-final { scan-assembler-times {\tstr\ts} 1 } } */ /* { dg-final { scan-assembler-times {\tldr\td} 2 } } */ /* { dg-final { scan-assembler-times {\tstr\td} 1 } } */
/* Each function should have three branches: one directly to the exit (n <= 0), one to the single scalar epilogue iteration (n == 1), and one branch-back for the vectorized loop. */ /* { dg-final { scan-assembler-times {\tb[.a-z]+\t} 12 } } */
|