Message ID | 1440511043-7622-1-git-send-email-alan.lawrence@arm.com |
---|---|
State | New |
Headers | show |
On 25 August 2015 at 15:57, Alan Lawrence <alan.lawrence@arm.com> wrote: > Sorry - wrong version posted. The hunk for add_options_for_arm_neon_fp16 has > moved to the previous patch! This version also fixes some whitespace issues. > This looks OK to me now, thanks. > gcc/testsuite/ChangeLog: > > * gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c: New. > * lib/target-supports.exp > (check_effective_target_arm_neon_fp16_hw_ok): New. > --- > .../aarch64/advsimd-intrinsics/vcvt_f16.c | 98 ++++++++++++++++++++++ > gcc/testsuite/lib/target-supports.exp | 15 ++++ > 2 files changed, 113 insertions(+) > create mode 100644 gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > new file mode 100644 > index 0000000..a2cfd38 > --- /dev/null > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > @@ -0,0 +1,98 @@ > +/* { dg-require-effective-target arm_neon_fp16_hw_ok { target { arm*-*-* } } } */ > +#include <arm_neon.h> > +#include "arm-neon-ref.h" > +#include "compute-ref-data.h" > +#include <math.h> > + > +/* Expected results for vcvt. */ > +VECT_VAR_DECL (expected,hfloat,32,4) [] = { 0x41800000, 0x41700000, > + 0x41600000, 0x41500000 }; > +VECT_VAR_DECL (expected,hfloat,16,4) [] = { 0x3e00, 0x4100, 0x4300, 0x4480 }; > + > +/* Expected results for vcvt_high_f32_f16. */ > +VECT_VAR_DECL (expected_high,hfloat,32,4) [] = { 0xc1400000, 0xc1300000, > + 0xc1200000, 0xc1100000 }; > +/* Expected results for vcvt_high_f16_f32. */ > +VECT_VAR_DECL (expected_high,hfloat,16,8) [] = { 0x4000, 0x4000, 0x4000, 0x4000, > + 0xcc00, 0xcb80, 0xcb00, 0xca80 }; > + > +void > +exec_vcvt (void) > +{ > + clean_results (); > + > +#define TEST_MSG vcvt_f32_f16 > + { > + VECT_VAR_DECL (buffer_src, float, 16, 4) [] = { 16.0, 15.0, 14.0, 13.0 }; > + > + DECL_VARIABLE (vector_src, float, 16, 4); > + > + VLOAD (vector_src, buffer_src, , float, f, 16, 4); > + DECL_VARIABLE (vector_res, float, 32, 4) = > + vcvt_f32_f16 (VECT_VAR (vector_src, float, 16, 4)); > + vst1q_f32 (VECT_VAR (result, float, 32, 4), > + VECT_VAR (vector_res, float, 32, 4)); > + > + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected, ""); > + } > +#undef TEST_MSG > + > + clean_results (); > + > +#define TEST_MSG vcvt_f16_f32 > + { > + VECT_VAR_DECL (buffer_src, float, 32, 4) [] = { 1.5, 2.5, 3.5, 4.5 }; > + DECL_VARIABLE (vector_src, float, 32, 4); > + > + VLOAD (vector_src, buffer_src, q, float, f, 32, 4); > + DECL_VARIABLE (vector_res, float, 16, 4) = > + vcvt_f16_f32 (VECT_VAR (vector_src, float, 32, 4)); > + vst1_f16 (VECT_VAR (result, float, 16, 4), > + VECT_VAR (vector_res, float, 16 ,4)); > + > + CHECK_FP (TEST_MSG, float, 16, 4, PRIx16, expected, ""); > + } > +#undef TEST_MSG > + > +#if defined (__aarch64__) > + clean_results (); > + > +#define TEST_MSG "vcvt_high_f32_f16" > + { > + DECL_VARIABLE (vector_src, float, 16, 8); > + VLOAD (vector_src, buffer, q, float, f, 16, 8); > + DECL_VARIABLE (vector_res, float, 32, 4); > + VECT_VAR (vector_res, float, 32, 4) = > + vcvt_high_f32_f16 (VECT_VAR (vector_src, float, 16, 8)); > + vst1q_f32 (VECT_VAR (result, float, 32, 4), > + VECT_VAR (vector_res, float, 32, 4)); > + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected_high, ""); > + } > +#undef TEST_MSG > + clean_results (); > + > +#define TEST_MSG "vcvt_high_f16_f32" > + { > + DECL_VARIABLE (vector_low, float, 16, 4); > + VDUP (vector_low, , float, f, 16, 4, 2.0); > + > + DECL_VARIABLE (vector_src, float, 32, 4); > + VLOAD (vector_src, buffer, q, float, f, 32, 4); > + > + DECL_VARIABLE (vector_res, float, 16, 8) = > + vcvt_high_f16_f32 (VECT_VAR (vector_low, float, 16, 4), > + VECT_VAR (vector_src, float, 32, 4)); > + vst1q_f16 (VECT_VAR (result, float, 16, 8), > + VECT_VAR (vector_res, float, 16, 8)); > + > + CHECK_FP (TEST_MSG, float, 16, 8, PRIx16, expected_high, ""); > + } > +#endif > +} > + > +int > +main (void) > +{ > + exec_vcvt (); > + return 0; > +} > diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp > index 9aec02d..0a22c95 100644 > --- a/gcc/testsuite/lib/target-supports.exp > +++ b/gcc/testsuite/lib/target-supports.exp > @@ -2730,6 +2730,21 @@ proc check_effective_target_arm_neon_fp16_ok { } { > check_effective_target_arm_neon_fp16_ok_nocache] > } > > +proc check_effective_target_arm_neon_fp16_hw_ok { } { > + if {! [check_effective_target_arm_neon_fp16_ok] } { > + return 0 > + } > + global et_arm_neon_fp16_flags > + check_runtime_nocache arm_neon_fp16_hw_ok { > + int > + main (int argc, char **argv) > + { > + asm ("vcvt.f32.f16 q1, d0"); > + return 0; > + } > + } $et_arm_neon_fp16_flags > +} > + > proc add_options_for_arm_neon_fp16 { flags } { > if { ! [check_effective_target_arm_neon_fp16_ok] } { > return "$flags" > -- > 1.8.3 >
Ping. (Thanks, Christophe!) Correct version here: https://gcc.gnu.org/ml/gcc-patches/2015-08/msg01501.html Cheers, Alan On 25/08/15 15:21, Christophe Lyon wrote: > On 25 August 2015 at 15:57, Alan Lawrence <alan.lawrence@arm.com> wrote: >> Sorry - wrong version posted. The hunk for add_options_for_arm_neon_fp16 has >> moved to the previous patch! This version also fixes some whitespace issues. >> > > This looks OK to me now, thanks. > >> gcc/testsuite/ChangeLog: >> >> * gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c: New. >> * lib/target-supports.exp >> (check_effective_target_arm_neon_fp16_hw_ok): New. >> --- >> .../aarch64/advsimd-intrinsics/vcvt_f16.c | 98 ++++++++++++++++++++++ >> gcc/testsuite/lib/target-supports.exp | 15 ++++ >> 2 files changed, 113 insertions(+) >> create mode 100644 gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >> >> diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >> new file mode 100644 >> index 0000000..a2cfd38 >> --- /dev/null >> +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >> @@ -0,0 +1,98 @@ >> +/* { dg-require-effective-target arm_neon_fp16_hw_ok { target { arm*-*-* } } } */ >> +#include <arm_neon.h> >> +#include "arm-neon-ref.h" >> +#include "compute-ref-data.h" >> +#include <math.h> >> + >> +/* Expected results for vcvt. */ >> +VECT_VAR_DECL (expected,hfloat,32,4) [] = { 0x41800000, 0x41700000, >> + 0x41600000, 0x41500000 }; >> +VECT_VAR_DECL (expected,hfloat,16,4) [] = { 0x3e00, 0x4100, 0x4300, 0x4480 }; >> + >> +/* Expected results for vcvt_high_f32_f16. */ >> +VECT_VAR_DECL (expected_high,hfloat,32,4) [] = { 0xc1400000, 0xc1300000, >> + 0xc1200000, 0xc1100000 }; >> +/* Expected results for vcvt_high_f16_f32. */ >> +VECT_VAR_DECL (expected_high,hfloat,16,8) [] = { 0x4000, 0x4000, 0x4000, 0x4000, >> + 0xcc00, 0xcb80, 0xcb00, 0xca80 }; >> + >> +void >> +exec_vcvt (void) >> +{ >> + clean_results (); >> + >> +#define TEST_MSG vcvt_f32_f16 >> + { >> + VECT_VAR_DECL (buffer_src, float, 16, 4) [] = { 16.0, 15.0, 14.0, 13.0 }; >> + >> + DECL_VARIABLE (vector_src, float, 16, 4); >> + >> + VLOAD (vector_src, buffer_src, , float, f, 16, 4); >> + DECL_VARIABLE (vector_res, float, 32, 4) = >> + vcvt_f32_f16 (VECT_VAR (vector_src, float, 16, 4)); >> + vst1q_f32 (VECT_VAR (result, float, 32, 4), >> + VECT_VAR (vector_res, float, 32, 4)); >> + >> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected, ""); >> + } >> +#undef TEST_MSG >> + >> + clean_results (); >> + >> +#define TEST_MSG vcvt_f16_f32 >> + { >> + VECT_VAR_DECL (buffer_src, float, 32, 4) [] = { 1.5, 2.5, 3.5, 4.5 }; >> + DECL_VARIABLE (vector_src, float, 32, 4); >> + >> + VLOAD (vector_src, buffer_src, q, float, f, 32, 4); >> + DECL_VARIABLE (vector_res, float, 16, 4) = >> + vcvt_f16_f32 (VECT_VAR (vector_src, float, 32, 4)); >> + vst1_f16 (VECT_VAR (result, float, 16, 4), >> + VECT_VAR (vector_res, float, 16 ,4)); >> + >> + CHECK_FP (TEST_MSG, float, 16, 4, PRIx16, expected, ""); >> + } >> +#undef TEST_MSG >> + >> +#if defined (__aarch64__) >> + clean_results (); >> + >> +#define TEST_MSG "vcvt_high_f32_f16" >> + { >> + DECL_VARIABLE (vector_src, float, 16, 8); >> + VLOAD (vector_src, buffer, q, float, f, 16, 8); >> + DECL_VARIABLE (vector_res, float, 32, 4); >> + VECT_VAR (vector_res, float, 32, 4) = >> + vcvt_high_f32_f16 (VECT_VAR (vector_src, float, 16, 8)); >> + vst1q_f32 (VECT_VAR (result, float, 32, 4), >> + VECT_VAR (vector_res, float, 32, 4)); >> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected_high, ""); >> + } >> +#undef TEST_MSG >> + clean_results (); >> + >> +#define TEST_MSG "vcvt_high_f16_f32" >> + { >> + DECL_VARIABLE (vector_low, float, 16, 4); >> + VDUP (vector_low, , float, f, 16, 4, 2.0); >> + >> + DECL_VARIABLE (vector_src, float, 32, 4); >> + VLOAD (vector_src, buffer, q, float, f, 32, 4); >> + >> + DECL_VARIABLE (vector_res, float, 16, 8) = >> + vcvt_high_f16_f32 (VECT_VAR (vector_low, float, 16, 4), >> + VECT_VAR (vector_src, float, 32, 4)); >> + vst1q_f16 (VECT_VAR (result, float, 16, 8), >> + VECT_VAR (vector_res, float, 16, 8)); >> + >> + CHECK_FP (TEST_MSG, float, 16, 8, PRIx16, expected_high, ""); >> + } >> +#endif >> +} >> + >> +int >> +main (void) >> +{ >> + exec_vcvt (); >> + return 0; >> +} >> diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp >> index 9aec02d..0a22c95 100644 >> --- a/gcc/testsuite/lib/target-supports.exp >> +++ b/gcc/testsuite/lib/target-supports.exp >> @@ -2730,6 +2730,21 @@ proc check_effective_target_arm_neon_fp16_ok { } { >> check_effective_target_arm_neon_fp16_ok_nocache] >> } >> >> +proc check_effective_target_arm_neon_fp16_hw_ok { } { >> + if {! [check_effective_target_arm_neon_fp16_ok] } { >> + return 0 >> + } >> + global et_arm_neon_fp16_flags >> + check_runtime_nocache arm_neon_fp16_hw_ok { >> + int >> + main (int argc, char **argv) >> + { >> + asm ("vcvt.f32.f16 q1, d0"); >> + return 0; >> + } >> + } $et_arm_neon_fp16_flags >> +} >> + >> proc add_options_for_arm_neon_fp16 { flags } { >> if { ! [check_effective_target_arm_neon_fp16_ok] } { >> return "$flags" >> -- >> 1.8.3 >> >
On 08/09/15 11:56, Alan Lawrence wrote: > Ping. (Thanks, Christophe!) > > Correct version here: https://gcc.gnu.org/ml/gcc-patches/2015-08/msg01501.html > > Cheers, Alan > > On 25/08/15 15:21, Christophe Lyon wrote: >> On 25 August 2015 at 15:57, Alan Lawrence <alan.lawrence@arm.com> wrote: >>> Sorry - wrong version posted. The hunk for add_options_for_arm_neon_fp16 has >>> moved to the previous patch! This version also fixes some whitespace issues. >>> >> This looks OK to me now, thanks. >> >>> gcc/testsuite/ChangeLog: >>> >>> * gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c: New. >>> * lib/target-supports.exp >>> (check_effective_target_arm_neon_fp16_hw_ok): New. >>> --- >>> .../aarch64/advsimd-intrinsics/vcvt_f16.c | 98 ++++++++++++++++++++++ >>> gcc/testsuite/lib/target-supports.exp | 15 ++++ >>> 2 files changed, 113 insertions(+) >>> create mode 100644 gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >>> >>> diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >>> new file mode 100644 >>> index 0000000..a2cfd38 >>> --- /dev/null >>> +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c >>> @@ -0,0 +1,98 @@ >>> +/* { dg-require-effective-target arm_neon_fp16_hw_ok { target { arm*-*-* } } } */ >>> +#include <arm_neon.h> >>> +#include "arm-neon-ref.h" >>> +#include "compute-ref-data.h" >>> +#include <math.h> >>> + >>> +/* Expected results for vcvt. */ >>> +VECT_VAR_DECL (expected,hfloat,32,4) [] = { 0x41800000, 0x41700000, >>> + 0x41600000, 0x41500000 }; >>> +VECT_VAR_DECL (expected,hfloat,16,4) [] = { 0x3e00, 0x4100, 0x4300, 0x4480 }; >>> + >>> +/* Expected results for vcvt_high_f32_f16. */ >>> +VECT_VAR_DECL (expected_high,hfloat,32,4) [] = { 0xc1400000, 0xc1300000, >>> + 0xc1200000, 0xc1100000 }; >>> +/* Expected results for vcvt_high_f16_f32. */ >>> +VECT_VAR_DECL (expected_high,hfloat,16,8) [] = { 0x4000, 0x4000, 0x4000, 0x4000, >>> + 0xcc00, 0xcb80, 0xcb00, 0xca80 }; >>> + >>> +void >>> +exec_vcvt (void) >>> +{ >>> + clean_results (); >>> + >>> +#define TEST_MSG vcvt_f32_f16 >>> + { >>> + VECT_VAR_DECL (buffer_src, float, 16, 4) [] = { 16.0, 15.0, 14.0, 13.0 }; >>> + >>> + DECL_VARIABLE (vector_src, float, 16, 4); >>> + >>> + VLOAD (vector_src, buffer_src, , float, f, 16, 4); >>> + DECL_VARIABLE (vector_res, float, 32, 4) = >>> + vcvt_f32_f16 (VECT_VAR (vector_src, float, 16, 4)); >>> + vst1q_f32 (VECT_VAR (result, float, 32, 4), >>> + VECT_VAR (vector_res, float, 32, 4)); >>> + >>> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected, ""); >>> + } >>> +#undef TEST_MSG >>> + >>> + clean_results (); >>> + >>> +#define TEST_MSG vcvt_f16_f32 >>> + { >>> + VECT_VAR_DECL (buffer_src, float, 32, 4) [] = { 1.5, 2.5, 3.5, 4.5 }; >>> + DECL_VARIABLE (vector_src, float, 32, 4); >>> + >>> + VLOAD (vector_src, buffer_src, q, float, f, 32, 4); >>> + DECL_VARIABLE (vector_res, float, 16, 4) = >>> + vcvt_f16_f32 (VECT_VAR (vector_src, float, 32, 4)); >>> + vst1_f16 (VECT_VAR (result, float, 16, 4), >>> + VECT_VAR (vector_res, float, 16 ,4)); >>> + >>> + CHECK_FP (TEST_MSG, float, 16, 4, PRIx16, expected, ""); >>> + } >>> +#undef TEST_MSG >>> + >>> +#if defined (__aarch64__) >>> + clean_results (); >>> + >>> +#define TEST_MSG "vcvt_high_f32_f16" >>> + { >>> + DECL_VARIABLE (vector_src, float, 16, 8); >>> + VLOAD (vector_src, buffer, q, float, f, 16, 8); >>> + DECL_VARIABLE (vector_res, float, 32, 4); >>> + VECT_VAR (vector_res, float, 32, 4) = >>> + vcvt_high_f32_f16 (VECT_VAR (vector_src, float, 16, 8)); >>> + vst1q_f32 (VECT_VAR (result, float, 32, 4), >>> + VECT_VAR (vector_res, float, 32, 4)); >>> + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected_high, ""); >>> + } >>> +#undef TEST_MSG >>> + clean_results (); >>> + >>> +#define TEST_MSG "vcvt_high_f16_f32" >>> + { >>> + DECL_VARIABLE (vector_low, float, 16, 4); >>> + VDUP (vector_low, , float, f, 16, 4, 2.0); >>> + >>> + DECL_VARIABLE (vector_src, float, 32, 4); >>> + VLOAD (vector_src, buffer, q, float, f, 32, 4); >>> + >>> + DECL_VARIABLE (vector_res, float, 16, 8) = >>> + vcvt_high_f16_f32 (VECT_VAR (vector_low, float, 16, 4), >>> + VECT_VAR (vector_src, float, 32, 4)); >>> + vst1q_f16 (VECT_VAR (result, float, 16, 8), >>> + VECT_VAR (vector_res, float, 16, 8)); >>> + >>> + CHECK_FP (TEST_MSG, float, 16, 8, PRIx16, expected_high, ""); >>> + } >>> +#endif >>> +} >>> + >>> +int >>> +main (void) >>> +{ >>> + exec_vcvt (); >>> + return 0; >>> +} >>> diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp >>> index 9aec02d..0a22c95 100644 >>> --- a/gcc/testsuite/lib/target-supports.exp >>> +++ b/gcc/testsuite/lib/target-supports.exp >>> @@ -2730,6 +2730,21 @@ proc check_effective_target_arm_neon_fp16_ok { } { >>> check_effective_target_arm_neon_fp16_ok_nocache] >>> } >>> >>> +proc check_effective_target_arm_neon_fp16_hw_ok { } { I see we're not using the *hw_ok naming anywhere else in target-supports.exp. For example, we have check_effective_target_arm_neon_hw, without the _ok. So I'd just call this check_effective_target_arm_neon_fp16_hw. Ok with that change. Thanks, Kyrill >>> + if {! [check_effective_target_arm_neon_fp16_ok] } { >>> + return 0 >>> + } >>> + global et_arm_neon_fp16_flags >>> + check_runtime_nocache arm_neon_fp16_hw_ok { >>> + int >>> + main (int argc, char **argv) >>> + { >>> + asm ("vcvt.f32.f16 q1, d0"); >>> + return 0; >>> + } >>> + } $et_arm_neon_fp16_flags >>> +} >>> + >>> proc add_options_for_arm_neon_fp16 { flags } { >>> if { ! [check_effective_target_arm_neon_fp16_ok] } { >>> return "$flags" >>> -- >>> 1.8.3 >>>
On 25 August 2015 at 14:57, Alan Lawrence <alan.lawrence@arm.com> wrote: > Sorry - wrong version posted. The hunk for add_options_for_arm_neon_fp16 has > moved to the previous patch! This version also fixes some whitespace issues. > > gcc/testsuite/ChangeLog: > > * gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c: New. > * lib/target-supports.exp > (check_effective_target_arm_neon_fp16_hw_ok): New. > --- > .../aarch64/advsimd-intrinsics/vcvt_f16.c | 98 ++++++++++++++++++++++ > gcc/testsuite/lib/target-supports.exp | 15 ++++ > 2 files changed, 113 insertions(+) > create mode 100644 gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > new file mode 100644 > index 0000000..a2cfd38 > --- /dev/null > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c > +#include <math.h> We should avoid dependencies on external header files. In this case I can't see that anything in math.h is needed any way. Otherwise OK with me. /Marcus
diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c new file mode 100644 index 0000000..a2cfd38 --- /dev/null +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vcvt_f16.c @@ -0,0 +1,98 @@ +/* { dg-require-effective-target arm_neon_fp16_hw_ok { target { arm*-*-* } } } */ +#include <arm_neon.h> +#include "arm-neon-ref.h" +#include "compute-ref-data.h" +#include <math.h> + +/* Expected results for vcvt. */ +VECT_VAR_DECL (expected,hfloat,32,4) [] = { 0x41800000, 0x41700000, + 0x41600000, 0x41500000 }; +VECT_VAR_DECL (expected,hfloat,16,4) [] = { 0x3e00, 0x4100, 0x4300, 0x4480 }; + +/* Expected results for vcvt_high_f32_f16. */ +VECT_VAR_DECL (expected_high,hfloat,32,4) [] = { 0xc1400000, 0xc1300000, + 0xc1200000, 0xc1100000 }; +/* Expected results for vcvt_high_f16_f32. */ +VECT_VAR_DECL (expected_high,hfloat,16,8) [] = { 0x4000, 0x4000, 0x4000, 0x4000, + 0xcc00, 0xcb80, 0xcb00, 0xca80 }; + +void +exec_vcvt (void) +{ + clean_results (); + +#define TEST_MSG vcvt_f32_f16 + { + VECT_VAR_DECL (buffer_src, float, 16, 4) [] = { 16.0, 15.0, 14.0, 13.0 }; + + DECL_VARIABLE (vector_src, float, 16, 4); + + VLOAD (vector_src, buffer_src, , float, f, 16, 4); + DECL_VARIABLE (vector_res, float, 32, 4) = + vcvt_f32_f16 (VECT_VAR (vector_src, float, 16, 4)); + vst1q_f32 (VECT_VAR (result, float, 32, 4), + VECT_VAR (vector_res, float, 32, 4)); + + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected, ""); + } +#undef TEST_MSG + + clean_results (); + +#define TEST_MSG vcvt_f16_f32 + { + VECT_VAR_DECL (buffer_src, float, 32, 4) [] = { 1.5, 2.5, 3.5, 4.5 }; + DECL_VARIABLE (vector_src, float, 32, 4); + + VLOAD (vector_src, buffer_src, q, float, f, 32, 4); + DECL_VARIABLE (vector_res, float, 16, 4) = + vcvt_f16_f32 (VECT_VAR (vector_src, float, 32, 4)); + vst1_f16 (VECT_VAR (result, float, 16, 4), + VECT_VAR (vector_res, float, 16 ,4)); + + CHECK_FP (TEST_MSG, float, 16, 4, PRIx16, expected, ""); + } +#undef TEST_MSG + +#if defined (__aarch64__) + clean_results (); + +#define TEST_MSG "vcvt_high_f32_f16" + { + DECL_VARIABLE (vector_src, float, 16, 8); + VLOAD (vector_src, buffer, q, float, f, 16, 8); + DECL_VARIABLE (vector_res, float, 32, 4); + VECT_VAR (vector_res, float, 32, 4) = + vcvt_high_f32_f16 (VECT_VAR (vector_src, float, 16, 8)); + vst1q_f32 (VECT_VAR (result, float, 32, 4), + VECT_VAR (vector_res, float, 32, 4)); + CHECK_FP (TEST_MSG, float, 32, 4, PRIx32, expected_high, ""); + } +#undef TEST_MSG + clean_results (); + +#define TEST_MSG "vcvt_high_f16_f32" + { + DECL_VARIABLE (vector_low, float, 16, 4); + VDUP (vector_low, , float, f, 16, 4, 2.0); + + DECL_VARIABLE (vector_src, float, 32, 4); + VLOAD (vector_src, buffer, q, float, f, 32, 4); + + DECL_VARIABLE (vector_res, float, 16, 8) = + vcvt_high_f16_f32 (VECT_VAR (vector_low, float, 16, 4), + VECT_VAR (vector_src, float, 32, 4)); + vst1q_f16 (VECT_VAR (result, float, 16, 8), + VECT_VAR (vector_res, float, 16, 8)); + + CHECK_FP (TEST_MSG, float, 16, 8, PRIx16, expected_high, ""); + } +#endif +} + +int +main (void) +{ + exec_vcvt (); + return 0; +} diff --git a/gcc/testsuite/lib/target-supports.exp b/gcc/testsuite/lib/target-supports.exp index 9aec02d..0a22c95 100644 --- a/gcc/testsuite/lib/target-supports.exp +++ b/gcc/testsuite/lib/target-supports.exp @@ -2730,6 +2730,21 @@ proc check_effective_target_arm_neon_fp16_ok { } { check_effective_target_arm_neon_fp16_ok_nocache] } +proc check_effective_target_arm_neon_fp16_hw_ok { } { + if {! [check_effective_target_arm_neon_fp16_ok] } { + return 0 + } + global et_arm_neon_fp16_flags + check_runtime_nocache arm_neon_fp16_hw_ok { + int + main (int argc, char **argv) + { + asm ("vcvt.f32.f16 q1, d0"); + return 0; + } + } $et_arm_neon_fp16_flags +} + proc add_options_for_arm_neon_fp16 { flags } { if { ! [check_effective_target_arm_neon_fp16_ok] } { return "$flags"