/* vec_perm_1_overrange_run.c */
/* { dg-do run { target aarch64_sve_hw } } */
/* { dg-options "-O" } */
/* { dg-options "-O -msve-vector-bits=256" { target aarch64_sve256_hw } } */
#include "vec_perm_1.c"
/* Check one permute.

   TYPE             type of the two data operands and of the result; it is
                    also pasted onto "vec_perm_" to name the routine that is
                    called (vec_perm_<TYPE>, expected to be supplied by the
                    included vec_perm_1.c).
   MASK_TYPE        type of the selector operand.
   EXPECTED_RESULT  value the routine must produce.
   VALUES1,
   VALUES2          the two data operands.
   MASK             the selector operand.

   Each argument is evaluated exactly once.  The result is compared with
   EXPECTED_RESULT byte-for-byte over sizeof (TYPE); any difference aborts
   the program.

   The body is wrapped in do ... while (0) so that an invocation followed by
   a semicolon is a single statement, which keeps it safe inside an
   unbraced if/else.  */
#define TEST_VEC_PERM(TYPE, MASK_TYPE, EXPECTED_RESULT,                  \
                      VALUES1, VALUES2, MASK)                            \
  do                                                                     \
    {                                                                    \
      TYPE expected_result = EXPECTED_RESULT;                            \
      TYPE values1 = VALUES1;                                            \
      TYPE values2 = VALUES2;                                            \
      MASK_TYPE mask = MASK;                                             \
      TYPE dest;                                                         \
      dest = vec_perm_##TYPE (values1, values2, mask);                   \
      if (__builtin_memcmp (&dest, &expected_result, sizeof (TYPE)) != 0) \
        __builtin_abort ();                                              \
    }                                                                    \
  while (0)
int main (void) { TEST_VEC_PERM (vnx2di, vnx2di, ((vnx2di) { 5, 36, 7, 48 }), ((vnx2di) { 4, 5, 6, 7 }), ((vnx2di) { 12, 24, 36, 48 }), ((vnx2di) { 1 + (8 * 1), 6 + (8 * 3), 3 + (8 * 1), 7 + (8 * 5) })); TEST_VEC_PERM (vnx4si, vnx4si, ((vnx4si) { 34, 38, 40, 10, 9, 8, 7, 35 }), ((vnx4si) { 3, 4, 5, 6, 7, 8, 9, 10 }), ((vnx4si) { 33, 34, 35, 36, 37, 38, 39, 40 }), ((vnx4si) { 9 + (16 * 2), 13 + (16 * 5), 15 + (16 * 1), 7 + (16 * 0), 6 + (16 * 8), 5 + (16 * 2), 4 + (16 * 3), 10 + (16 * 2) })); TEST_VEC_PERM (vnx8hi, vnx8hi, ((vnx8hi) { 12, 16, 18, 10, 42, 43, 44, 34, 7, 48, 3, 35, 9, 8, 7, 13 }), ((vnx8hi) { 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18 }), ((vnx8hi) { 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48 }), ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2), 15 + (32 * 8), 7 + (32 * 9), 25 + (32 * 4), 26 + (32 * 3), 27 + (32 * 1), 17 + (32 * 2), 4 + (32 * 6), 31 + (32 * 7), 0 + (32 * 8), 18 + (32 * 9), 6 + (32 * 6), 5 + (32 * 7), 4 + (32 * 2), 10 + (32 * 2) })); TEST_VEC_PERM (vnx16qi, vnx16qi, ((vnx16qi) { 5, 6, 7, 4, 5, 6, 4, 5, 6, 7, 12, 24, 36, 48, 12, 24, 5, 6, 7, 4, 5, 6, 4, 5, 6, 7, 12, 24, 36, 48, 12, 24 }), ((vnx16qi) { 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7, 4, 5, 6, 7 }), ((vnx16qi) { 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48, 12, 24, 36, 48 }), ((vnx16qi) { 5 + (64 * 3), 6 + (64 * 1), 7 + (64 * 2), 8 + (64 * 1), 9 + (64 * 3), 10 + (64 * 1), 28 + (64 * 3), 29 + (64 * 3), 30 + (64 * 1), 31 + (64 * 1), 32 + (64 * 3), 33 + (64 * 2), 54 + (64 * 2), 55 + (64 * 2), 56 + (64 * 1), 61 + (64 * 2), 5 + (64 * 2), 6 + (64 * 1), 7 + (64 * 2), 8 + (64 * 2), 9 + (64 * 2), 10 + (64 * 1), 28 + (64 * 3), 29 + (64 * 1), 30 + (64 * 3), 31 + (64 * 3), 32 + (64 * 1), 33 + (64 * 1), 54 + (64 * 2), 55 + (64 * 2), 56 + (64 * 2), 61 + (64 * 2) })); TEST_VEC_PERM (vnx2df, vnx2di, ((vnx2df) { 5.1, 36.1, 7.1, 48.1 }), ((vnx2df) { 4.1, 5.1, 6.1, 
7.1 }), ((vnx2df) { 12.1, 24.1, 36.1, 48.1 }), ((vnx2di) { 1 + (8 * 3), 6 + (8 * 10), 3 + (8 * 8), 7 + (8 * 2) })); TEST_VEC_PERM (vnx4sf, vnx4si, ((vnx4sf) { 34.2, 38.2, 40.2, 10.2, 9.2, 8.2, 7.2, 35.2 }), ((vnx4sf) { 3.2, 4.2, 5.2, 6.2, 7.2, 8.2, 9.2, 10.2 }), ((vnx4sf) { 33.2, 34.2, 35.2, 36.2, 37.2, 38.2, 39.2, 40.2 }), ((vnx4si) { 9 + (16 * 1), 13 + (16 * 5), 15 + (16 * 4), 7 + (16 * 4), 6 + (16 * 3), 5 + (16 * 2), 4 + (16 * 1), 10 + (16 * 0) })); TEST_VEC_PERM (vnx8hf, vnx8hi, ((vnx8hf) { 12.0, 16.0, 18.0, 10.0, 42.0, 43.0, 44.0, 34.0, 7.0, 48.0, 3.0, 35.0, 9.0, 8.0, 7.0, 13.0 }), ((vnx8hf) { 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0, 11.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0 }), ((vnx8hf) { 33.0, 34.0, 35.0, 36.0, 37.0, 38.0, 39.0, 40.0, 41.0, 42.0, 43.0, 44.0, 45.0, 46.0, 47.0, 48.0 }), ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2), 15 + (32 * 8), 7 + (32 * 9), 25 + (32 * 4), 26 + (32 * 3), 27 + (32 * 1), 17 + (32 * 2), 4 + (32 * 6), 31 + (32 * 7), 0 + (32 * 8), 18 + (32 * 9), 6 + (32 * 6), 5 + (32 * 7), 4 + (32 * 2), 10 + (32 * 2) })); return 0; }
|