/* avx512er-vrsqrt28ss-2.c */
/* { dg-do run } */
/* { dg-require-effective-target avx512er } */
/* { dg-options "-O2 -mavx512er" } */
/* Project-local test-harness headers, followed by the C math library
   (the test body calls sqrt).  Each directive must sit on its own line:
   a preprocessor directive extends to the end of the line.  */
#include "avx512er-check.h"
#include "avx512f-mask-type.h"
#include "avx512f-helper.h"
#include <math.h>

/* Mask value passed to the masked rsqrt28 intrinsics; 0x23 has bit 0
   set.  */
#define IMM 0x23
void static avx512er_test (void) { union128 src1, src2, res, res1, res2, res3, res4; float res_ref[4]; MASK_TYPE mask = MASK_VALUE; int i; for (i = 0; i < 4; i++) { src1.a[i] = 179.345 - 6.5645 * i; src2.a[i] = 179221345 + 6.5645 * i; res_ref[i] = src1.a[i]; }
res_ref[0] = 1.0 / sqrt (src2.a[0]);
res.x = _mm_rsqrt28_round_ss (src1.x, src2.x, _MM_FROUND_NO_EXC); res1.x = _mm_mask_rsqrt28_ss (src1.x, IMM, src1.x, src2.x); res2.x = _mm_mask_rsqrt28_round_ss (src1.x, IMM, src1.x, src2.x, _MM_FROUND_TO_NEAREST_INT | _MM_FROUND_NO_EXC); res3.x = _mm_maskz_rsqrt28_ss (IMM, src1.x, src2.x); res4.x = _mm_maskz_rsqrt28_round_ss (IMM, src1.x, src2.x, _MM_FROUND_TO_NEAREST_INT | _MM_FROUND_NO_EXC);
if (checkVf (res.a, res_ref, 4)) abort (); MASK_MERGE () (res_ref, mask, 1);
if (checkVf (res1.a, res_ref, 2)) abort ();
if (checkVf (res2.a, res_ref, 2)) abort ();
MASK_ZERO () (res_ref, mask, 1);
if (checkVf (res3.a, res_ref, 2)) abort ();
if (checkVf (res4.a, res_ref, 2)) abort (); }
|