/* { dg-do run } */
/* { dg-options "-O2 -mavx512f" } */
/* { dg-require-effective-target avx512f } */
/* Defined ahead of avx512f-helper.h; presumably consumed by that header
   (its contents are not visible here).  */
#define AVX512F

#include "avx512f-helper.h"

/* Element count used below for the reference array and for every
   per-element loop.  AVX512F_LEN is presumably the vector width in bits,
   making this the number of 64-bit doubles per vector -- confirm against
   avx512f-helper.h.

   Each directive must sit on its own line: anything following the
   replacement list on the #define line would become part of the macro
   body instead of being processed as a directive.  SIZE is kept ahead of
   avx512f-mask-type.h, as in the original ordering (that header
   presumably depends on it).  */
#define SIZE (AVX512F_LEN / 64)
#include "avx512f-mask-type.h"
#include "math.h"
/* Scalar reference used by TEST to validate the vector intrinsics.

   S    input array of SIZE doubles.
   R    output array of SIZE doubles.
   IMM  control value: the low four bits select the rounding mode
        (_MM_FROUND_FLOOR or _MM_FROUND_CEIL), the remaining upper bits
        give the exponent M of the scale factor 2^M.

   Each element is multiplied by 2^M, rounded with the selected mode and
   divided by 2^M again.  Any other rounding mode aborts.  */
static void
CALC (double *s, double *r, int imm)
{
  const int mode = imm & 0xf;
  const int exponent = imm >> 4;
  /* The scale factor does not depend on the element, so compute it once.  */
  const double scale = pow (2, exponent);
  int idx;

  for (idx = 0; idx < SIZE; idx++)
    {
      const double scaled = s[idx] * scale;

      if (mode == _MM_FROUND_FLOOR)
        r[idx] = floor (scaled) / scale;
      else if (mode == _MM_FROUND_CEIL)
        r[idx] = ceil (scaled) / scale;
      else
        abort ();
    }
}
void TEST (void) { int imm, i, j; UNION_TYPE (AVX512F_LEN, d) res1,res2,res3,s; double res_ref[SIZE];
MASK_TYPE mask = 6 ^ (0xff >> SIZE);
imm = _MM_FROUND_FLOOR | (7 << 4);
for (i = 0; i < 3; i++) {
for (j = 0; j < SIZE; j++) { s.a[j] = j * (j + 12.0231); res1.a[j] = DEFAULT_VALUE; res2.a[j] = DEFAULT_VALUE; res3.a[j] = DEFAULT_VALUE; }
switch (i) { case 0: imm = _MM_FROUND_FLOOR | (7 << 4); res1.x = INTRINSIC (_roundscale_pd) (s.x, imm); res2.x = INTRINSIC (_mask_roundscale_pd) (res2.x, mask, s.x, imm); res3.x = INTRINSIC (_maskz_roundscale_pd) (mask, s.x, imm); break; case 1: imm = _MM_FROUND_FLOOR; res1.x = INTRINSIC (_floor_pd) (s.x); #if AVX512F_LEN == 512 res2.x = INTRINSIC (_mask_floor_pd) (res2.x, mask, s.x); #endif break; case 2: imm = _MM_FROUND_CEIL; res1.x = INTRINSIC (_ceil_pd) (s.x); #if AVX512F_LEN == 512 res2.x = INTRINSIC (_mask_ceil_pd) (res2.x, mask, s.x); #endif break; }
CALC (s.a, res_ref, imm);
if (UNION_CHECK (AVX512F_LEN, d) (res1, res_ref)) abort ();
MASK_MERGE(d) (res_ref,mask,SIZE );
#if AVX512F_LEN == 512 if (UNION_CHECK (AVX512F_LEN, d) (res2, res_ref)) abort (); #else if (!i && UNION_CHECK (AVX512F_LEN, d) (res2, res_ref)) abort (); #endif
MASK_ZERO(d) (res_ref,mask,SIZE );
if (!i && UNION_CHECK (AVX512F_LEN, d) (res3, res_ref)) abort ();
} }
|