Viewing file: bfmlalt_lane_f32.c (2.24 KB) -rw-r--r-- Select action/file-type: (+) | (+) | (+) | Code (+) | Session (+) | (+) | SDB (+) | (+) | (+) | (+) | (+) | (+) |
/* { dg-additional-options "-march=armv8.2-a+sve+bf16" } */ /* { dg-require-effective-target aarch64_asm_bf16_ok } */ /* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
#include "test_sve_acle.h"
/* ** bfmlalt_lane_0_f32_tied1: ** bfmlalt z0\.s, z4\.h, z5\.h\[0\] ** ret */ TEST_DUAL_Z (bfmlalt_lane_0_f32_tied1, svfloat32_t, svbfloat16_t, z0 = svbfmlalt_lane_f32 (z0, z4, z5, 0), z0 = svbfmlalt_lane (z0, z4, z5, 0))
/* ** bfmlalt_lane_0_f32_tied2: ** mov (z[0-9]+)\.d, z0\.d ** movprfx z0, z4 ** bfmlalt z0\.s, \1\.h, z1\.h\[0\] ** ret */ TEST_DUAL_Z_REV (bfmlalt_lane_0_f32_tied2, svfloat32_t, svbfloat16_t, z0_res = svbfmlalt_lane_f32 (z4, z0, z1, 0), z0_res = svbfmlalt_lane (z4, z0, z1, 0))
/* ** bfmlalt_lane_0_f32_tied3: ** mov (z[0-9]+)\.d, z0\.d ** movprfx z0, z4 ** bfmlalt z0\.s, z1\.h, \1\.h\[0\] ** ret */ TEST_DUAL_Z_REV (bfmlalt_lane_0_f32_tied3, svfloat32_t, svbfloat16_t, z0_res = svbfmlalt_lane_f32 (z4, z1, z0, 0), z0_res = svbfmlalt_lane (z4, z1, z0, 0))
/* ** bfmlalt_lane_0_f32_untied: ** movprfx z0, z1 ** bfmlalt z0\.s, z4\.h, z5\.h\[0\] ** ret */ TEST_DUAL_Z (bfmlalt_lane_0_f32_untied, svfloat32_t, svbfloat16_t, z0 = svbfmlalt_lane_f32 (z1, z4, z5, 0), z0 = svbfmlalt_lane (z1, z4, z5, 0))
/* ** bfmlalt_lane_1_f32: ** bfmlalt z0\.s, z4\.h, z5\.h\[1\] ** ret */ TEST_DUAL_Z (bfmlalt_lane_1_f32, svfloat32_t, svbfloat16_t, z0 = svbfmlalt_lane_f32 (z0, z4, z5, 1), z0 = svbfmlalt_lane (z0, z4, z5, 1))
/* ** bfmlalt_lane_7_f32: ** bfmlalt z0\.s, z4\.h, z5\.h\[7\] ** ret */ TEST_DUAL_Z (bfmlalt_lane_7_f32, svfloat32_t, svbfloat16_t, z0 = svbfmlalt_lane_f32 (z0, z4, z5, 7), z0 = svbfmlalt_lane (z0, z4, z5, 7))
/* ** bfmlalt_lane_z8_f32: ** str d8, \[sp, -16\]! ** mov (z[0-7])\.d, z8\.d ** bfmlalt z0\.s, z1\.h, \1\.h\[1\] ** ldr d8, \[sp\], 16 ** ret */ TEST_DUAL_LANE_REG (bfmlalt_lane_z8_f32, svfloat32_t, svbfloat16_t, z8, z0 = svbfmlalt_lane_f32 (z0, z1, z8, 1), z0 = svbfmlalt_lane (z0, z1, z8, 1))
/* ** bfmlalt_lane_z16_f32: ** mov (z[0-7])\.d, z16\.d ** bfmlalt z0\.s, z1\.h, \1\.h\[1\] ** ret */ TEST_DUAL_LANE_REG (bfmlalt_lane_z16_f32, svfloat32_t, svbfloat16_t, z16, z0 = svbfmlalt_lane_f32 (z0, z1, z16, 1), z0 = svbfmlalt_lane (z0, z1, z16, 1))
|