This is the mail archive of the
gcc-patches@gcc.gnu.org
mailing list for the GCC project.
Re: [PATCH 14/15][ARM/AArch64 Testsuite]Add test of vcvt{,_high}_i{f32_f16,f16_f32}
- From: Christophe Lyon <christophe dot lyon at linaro dot org>
- To: Alan Lawrence <alan dot lawrence at arm dot com>
- Cc: "gcc-patches at gcc dot gnu dot org" <gcc-patches at gcc dot gnu dot org>
- Date: Tue, 25 Aug 2015 16:21:41 +0200
- Subject: Re: [PATCH 14/15][ARM/AArch64 Testsuite]Add test of vcvt{,_high}_i{f32_f16,f16_f32}
- Authentication-results: sourceware.org; auth=none
- References: <55B7670B dot 1090902 at arm dot com> <1440511043-7622-1-git-send-email-alan dot lawrence at arm dot com>
On 25 August 2015 at 15:57, Alan Lawrence <alan.lawrence@arm.com> wrote:
> Sorry - wrong version posted. The hunk for add_options_for_arm_neon_fp16 has
> moved to the previous patch! This version also fixes some whitespace issues.
>
This looks OK to me now, thanks.
> gcc/testsuite/ChangeLog:
>
> * gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c: New.
> * lib/target-supports.exp
> (check_effective_target_arm_neon_fp16_hw_ok): New.
> ---
> .../aarch64/advsimd-intrinsics/vcvt_f16.c | 98 ++++++++++++++++++++++
> gcc/testsuite/lib/target-supports.exp | 15 ++++
> 2 files changed, 113 insertions(+)
> create mode 100644 gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c
>
> diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c
> new file mode 100644
> index 0000000..a2cfd38
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c
> @@ -0,0 +1,98 @@
> +/* { dg-require-effective-target arm_neon_fp16_hw_ok { target { arm*-*-* } } } */
> +#include <arm_neon.h>
> +#include "arm-neon-ref.h"
> +#include "compute-ref-data.h"
> +#include <math.h>
> +
> +/* Expected results for vcvt. */
> +VECT_VAR_DECL (expected,hfloat,32,4) [] = { 0x41800000, 0x41700000,
> + 0x41600000, 0x41500000 };
> +VECT_VAR_DECL (expected,hfloat,16,4) [] = { 0x3e00, 0x4100, 0x4300, 0x4480 };
> +
> +/* Expected results for vcvt_high_f32_f16. */
> +VECT_VAR_DECL (expected_high,hfloat,32,4) [] = { 0xc1400000, 0xc1300000,
> + 0xc1200000, 0xc1100000 };
> +/* Expected results for vcvt_high_f16_f32. */
> +VECT_VAR_DECL (expected_high,hfloat,16,8) [] = { 0x4000, 0x4000, 0x4000, 0x4000,
> + 0xcc00, 0xcb80, 0xcb00, 0xca80 };
> +
> +void
> +exec_vcvt (void)
> +{
> + clean_results ();
> +
> +#define TEST_MSG vcvt_f32_f16
> + {
> + VECT_VAR_DECL (buffer_src, float, 16, 4) [] = { 16.0, 15.0, 14.0, 13.0 };
> +
> + DECL_VARIABLE (vector_src, float, 16, 4);
> +
> + VLOAD (vector_src, buffer_src, , float, f, 16, 4);
> + DECL_VARIABLE (vector_res, float, 32, 4) =
> + vcvt_f32_f16 (VECT_VAR (vector_src, float, 16, 4));
> + vst1q_f32 (VECT_VAR (result, float, 32, 4),
> + VECT_VAR (vector_res, float, 32, 4));
> +
> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected, "");
> + }
> +#undef TEST_MSG
> +
> + clean_results ();
> +
> +#define TEST_MSG vcvt_f16_f32
> + {
> + VECT_VAR_DECL (buffer_src, float, 32, 4) [] = { 1.5, 2.5, 3.5, 4.5 };
> + DECL_VARIABLE (vector_src, float, 32, 4);
> +
> + VLOAD (vector_src, buffer_src, q, float, f, 32, 4);
> + DECL_VARIABLE (vector_res, float, 16, 4) =
> + vcvt_f16_f32 (VECT_VAR (vector_src, float, 32, 4));
> + vst1_f16 (VECT_VAR (result, float, 16, 4),
> + VECT_VAR (vector_res, float, 16 ,4));
> +
> + CHECK_FP (TEST_MSG, float, 16, 4, PRIx16, expected, "");
> + }
> +#undef TEST_MSG
> +
> +#if defined (__aarch64__)
> + clean_results ();
> +
> +#define TEST_MSG "vcvt_high_f32_f16"
> + {
> + DECL_VARIABLE (vector_src, float, 16, 8);
> + VLOAD (vector_src, buffer, q, float, f, 16, 8);
> + DECL_VARIABLE (vector_res, float, 32, 4);
> + VECT_VAR (vector_res, float, 32, 4) =
> + vcvt_high_f32_f16 (VECT_VAR (vector_src, float, 16, 8));
> + vst1q_f32 (VECT_VAR (result, float, 32, 4),
> + VECT_VAR (vector_res, float, 32, 4));
> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected_high, "");
> + }
> +#undef TEST_MSG
> + clean_results ();
> +
> +#define TEST_MSG "vcvt_high_f16_f32"
> + {
> + DECL_VARIABLE (vector_low, float, 16, 4);
> + VDUP (vector_low, , float, f, 16, 4, 2.0);
> +
> + DECL_VARIABLE (vector_src, float, 32, 4);
> + VLOAD (vector_src, buffer, q, float, f, 32, 4);
> +
> + DECL_VARIABLE (vector_res, float, 16, 8) =
> + vcvt_high_f16_f32 (VECT_VAR (vector_low, float, 16, 4),
> + VECT_VAR (vector_src, float, 32, 4));
> + vst1q_f16 (VECT_VAR (result, float, 16, 8),
> + VECT_VAR (vector_res, float, 16, 8));
> +
> + CHECK_FP (TEST_MSG, float, 16, 8, PRIx16, expected_high, "");
> + }
> +#endif
> +}
> +
> +int
> +main (void)
> +{
> + exec_vcvt ();
> + return 0;
> +}
> diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp
> index 9aec02d..0a22c95 100644
> --- a/gcc/testsuite/lib/target-supports.exp
> +++ b/gcc/testsuite/lib/target-supports.exp
> @@ -2730,6 +2730,21 @@ proc check_effective_target_arm_neon_fp16_ok { } {
> check_effective_target_arm_neon_fp16_ok_nocache]
> }
>
> +proc check_effective_target_arm_neon_fp16_hw_ok { } {
> + if {! [check_effective_target_arm_neon_fp16_ok] } {
> + return 0
> + }
> + global et_arm_neon_fp16_flags
> + check_runtime_nocache arm_neon_fp16_hw_ok {
> + int
> + main (int argc, char **argv)
> + {
> + asm ("vcvt.f32.f16 q1, d0");
> + return 0;
> + }
> + } $et_arm_neon_fp16_flags
> +}
> +
> proc add_options_for_arm_neon_fp16 { flags } {
> if { ! [check_effective_target_arm_neon_fp16_ok] } {
> return "$flags"
> --
> 1.8.3
>