Index: compiler-rt/cmake/builtin-config-ix.cmake =================================================================== --- compiler-rt/cmake/builtin-config-ix.cmake +++ compiler-rt/cmake/builtin-config-ix.cmake @@ -22,6 +22,13 @@ } ") +builtin_check_c_compiler_source(COMPILER_RT_HAS_FLOAT16 +" +_Float16 foo(_Float16 x) { + return x; +} +" +) set(ARM64 aarch64) set(ARM32 arm armhf armv6m armv7m armv7em armv7 armv7s armv7k) Index: compiler-rt/lib/builtins/CMakeLists.txt =================================================================== --- compiler-rt/lib/builtins/CMakeLists.txt +++ compiler-rt/lib/builtins/CMakeLists.txt @@ -169,6 +169,7 @@ divtc3.c divtf3.c extenddftf2.c + extendhftf2.c extendsftf2.c fixtfdi.c fixtfsi.c @@ -187,6 +188,7 @@ powitf2.c subtf3.c trunctfdf2.c + trunctfhf2.c trunctfsf2.c ) @@ -607,6 +609,8 @@ else () set(BUILTIN_CFLAGS "") + append_list_if(COMPILER_RT_HAS_FLOAT16 -DCOMPILER_RT_HAS_FLOAT16 BUILTIN_CFLAGS) + append_list_if(COMPILER_RT_HAS_STD_C11_FLAG -std=c11 BUILTIN_CFLAGS) # These flags would normally be added to CMAKE_C_FLAGS by the llvm Index: compiler-rt/lib/builtins/extendhfsf2.c =================================================================== --- compiler-rt/lib/builtins/extendhfsf2.c +++ compiler-rt/lib/builtins/extendhfsf2.c @@ -12,15 +12,15 @@ // Use a forwarding definition and noinline to implement a poor man's alias, // as there isn't a good cross-platform way of defining one. -COMPILER_RT_ABI NOINLINE float __extendhfsf2(uint16_t a) { +COMPILER_RT_ABI NOINLINE float __extendhfsf2(src_t a) { return __extendXfYf2__(a); } -COMPILER_RT_ABI float __gnu_h2f_ieee(uint16_t a) { return __extendhfsf2(a); } +COMPILER_RT_ABI float __gnu_h2f_ieee(src_t a) { return __extendhfsf2(a); } #if defined(__ARM_EABI__) #if defined(COMPILER_RT_ARMHF_TARGET) -AEABI_RTABI float __aeabi_h2f(uint16_t a) { return __extendhfsf2(a); } +AEABI_RTABI float __aeabi_h2f(src_t a) { return __extendhfsf2(a); } #else COMPILER_RT_ALIAS(__extendhfsf2, __aeabi_h2f) #endif Index: compiler-rt/lib/builtins/extendhftf2.c =================================================================== --- /dev/null +++ compiler-rt/lib/builtins/extendhftf2.c @@ -0,0 +1,23 @@ +//===-- lib/extendhfsf2.c - half -> quad conversion ---------------*- C -*-===// +// +// The LLVM Compiler Infrastructure +// +// This file is dual licensed under the MIT and the University of Illinois Open +// Source Licenses. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// + +#define QUAD_PRECISION +#include "fp_lib.h" + +#if defined(CRT_HAS_128BIT) && defined(CRT_LDBL_128BIT) \ + && defined(COMPILER_RT_HAS_FLOAT16) +#define SRC_HALF +#define DST_QUAD +#include "fp_extend_impl.inc" + +COMPILER_RT_ABI long double __extendhftf2(src_t a) { + return __extendXfYf2__(a); +} + +#endif Index: compiler-rt/lib/builtins/fp_extend.h =================================================================== --- compiler-rt/lib/builtins/fp_extend.h +++ compiler-rt/lib/builtins/fp_extend.h @@ -40,7 +40,11 @@ } #elif defined SRC_HALF +#if defined COMPILER_RT_HAS_FLOAT16 +typedef _Float16 src_t; +#else typedef uint16_t src_t; +#endif typedef uint16_t src_rep_t; #define SRC_REP_C UINT16_C static const int srcSigBits = 10; Index: compiler-rt/lib/builtins/fp_trunc.h =================================================================== --- compiler-rt/lib/builtins/fp_trunc.h +++ compiler-rt/lib/builtins/fp_trunc.h @@ -50,7 +50,11 @@ static const int dstSigBits = 23; #elif defined DST_HALF +#if defined COMPILER_RT_HAS_FLOAT16 +typedef _Float16 dst_t; +#else typedef uint16_t dst_t; +#endif typedef uint16_t dst_rep_t; #define DST_REP_C UINT16_C static const int dstSigBits = 10; Index: compiler-rt/lib/builtins/truncdfhf2.c =================================================================== --- compiler-rt/lib/builtins/truncdfhf2.c +++ compiler-rt/lib/builtins/truncdfhf2.c @@ -10,11 +10,11 @@ #define DST_HALF #include "fp_trunc_impl.inc" -COMPILER_RT_ABI uint16_t __truncdfhf2(double a) { return __truncXfYf2__(a); } +COMPILER_RT_ABI dst_t __truncdfhf2(double a) { return __truncXfYf2__(a); } #if defined(__ARM_EABI__) #if defined(COMPILER_RT_ARMHF_TARGET) -AEABI_RTABI uint16_t __aeabi_d2h(double a) { return __truncdfhf2(a); } +AEABI_RTABI dst_t __aeabi_d2h(double a) { return __truncdfhf2(a); } #else COMPILER_RT_ALIAS(__truncdfhf2, __aeabi_d2h) #endif Index: compiler-rt/lib/builtins/truncsfhf2.c =================================================================== --- compiler-rt/lib/builtins/truncsfhf2.c +++ compiler-rt/lib/builtins/truncsfhf2.c @@ -12,15 +12,15 @@ // Use a forwarding definition and noinline to implement a poor man's alias, // as there isn't a good cross-platform way of defining one. -COMPILER_RT_ABI NOINLINE uint16_t __truncsfhf2(float a) { +COMPILER_RT_ABI NOINLINE dst_t __truncsfhf2(float a) { return __truncXfYf2__(a); } -COMPILER_RT_ABI uint16_t __gnu_f2h_ieee(float a) { return __truncsfhf2(a); } +COMPILER_RT_ABI dst_t __gnu_f2h_ieee(float a) { return __truncsfhf2(a); } #if defined(__ARM_EABI__) #if defined(COMPILER_RT_ARMHF_TARGET) -AEABI_RTABI uint16_t __aeabi_f2h(float a) { return __truncsfhf2(a); } +AEABI_RTABI dst_t __aeabi_f2h(float a) { return __truncsfhf2(a); } #else COMPILER_RT_ALIAS(__truncsfhf2, __aeabi_f2h) #endif Index: compiler-rt/lib/builtins/trunctfhf2.c =================================================================== --- /dev/null +++ compiler-rt/lib/builtins/trunctfhf2.c @@ -0,0 +1,23 @@ +//===-- lib/trunctfhf2.c - quad -> half conversion ----------------*- C -*-===// +// +// The LLVM Compiler Infrastructure +// +// This file is dual licensed under the MIT and the University of Illinois Open +// Source Licenses. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// + +#define QUAD_PRECISION +#include "fp_lib.h" + +#if defined(CRT_HAS_128BIT) && defined(CRT_LDBL_128BIT) \ + && defined(COMPILER_RT_HAS_FLOAT16) +#define SRC_QUAD +#define DST_HALF +#include "fp_trunc_impl.inc" + +COMPILER_RT_ABI dst_t __trunctfhf2(long double a) { + return __truncXfYf2__(a); +} + +#endif Index: compiler-rt/test/builtins/CMakeLists.txt =================================================================== --- compiler-rt/test/builtins/CMakeLists.txt +++ compiler-rt/test/builtins/CMakeLists.txt @@ -44,6 +44,8 @@ string(REPLACE ";" " " BUILTINS_TEST_TARGET_CFLAGS "${BUILTINS_TEST_TARGET_CFLAGS}") endif() + append_list_if(COMPILER_RT_HAS_FLOAT16 -DCOMPILER_RT_HAS_FLOAT16 BUILTINS_TEST_TARGET_CFLAGS) + # Compute builtins available in library and add them as lit features. if(APPLE) # TODO: Support other Apple platforms. Index: compiler-rt/test/builtins/Unit/extendhfsf2_test.c =================================================================== --- compiler-rt/test/builtins/Unit/extendhfsf2_test.c +++ compiler-rt/test/builtins/Unit/extendhfsf2_test.c @@ -5,98 +5,97 @@ #include "fp_test.h" -float __extendhfsf2(uint16_t a); +float __extendhfsf2(TYPE_FP16 a); -int test__extendhfsf2(uint16_t a, float expected) +int test__extendhfsf2(TYPE_FP16 a, float expected) { - float x = __extendhfsf2(a); + TYPE_FP16 x = __extendhfsf2(a); int ret = compareResultH(x, expected); if (ret){ printf("error in test__extendhfsf2(%#.4x) = %f, " - "expected %f\n", a, x, expected); + "expected %f\n", fromRep16(a), x, expected); } return ret; } -char assumption_1[sizeof(__fp16) * CHAR_BIT == 16] = {0}; +char assumption_1[sizeof(TYPE_FP16) * CHAR_BIT == 16] = {0}; int main() { // qNaN - if (test__extendhfsf2(UINT16_C(0x7e00), + if (test__extendhfsf2(fromRep16(0x7e00), makeQNaN32())) return 1; // NaN - if (test__extendhfsf2(UINT16_C(0x7e00), - makeNaN32(UINT32_C(0x8000)))) + if (test__extendhfsf2(fromRep16(0x7d00), + makeQNaN32())) return 1; // inf - if (test__extendhfsf2(UINT16_C(0x7c00), + if (test__extendhfsf2(fromRep16(0x7c00), makeInf32())) return 1; - if (test__extendhfsf2(UINT16_C(0xfc00), + if (test__extendhfsf2(fromRep16(0xfc00), -makeInf32())) return 1; // zero - if (test__extendhfsf2(UINT16_C(0x0), + if (test__extendhfsf2(fromRep16(0x0), 0.0f)) return 1; - if (test__extendhfsf2(UINT16_C(0x8000), + if (test__extendhfsf2(fromRep16(0x8000), -0.0f)) return 1; - - if (test__extendhfsf2(UINT16_C(0x4248), + if (test__extendhfsf2(fromRep16(0x4248), 3.1415926535f)) return 1; - if (test__extendhfsf2(UINT16_C(0xc248), + if (test__extendhfsf2(fromRep16(0xc248), -3.1415926535f)) return 1; - if (test__extendhfsf2(UINT16_C(0x7c00), + if (test__extendhfsf2(fromRep16(0x7c00), 0x1.987124876876324p+100f)) return 1; - if (test__extendhfsf2(UINT16_C(0x6e62), + if (test__extendhfsf2(fromRep16(0x6e62), 0x1.988p+12f)) return 1; - if (test__extendhfsf2(UINT16_C(0x3c00), + if (test__extendhfsf2(fromRep16(0x3c00), 0x1.0p+0f)) return 1; - if (test__extendhfsf2(UINT16_C(0x0400), + if (test__extendhfsf2(fromRep16(0x0400), 0x1.0p-14f)) return 1; // denormal - if (test__extendhfsf2(UINT16_C(0x0010), + if (test__extendhfsf2(fromRep16(0x0010), 0x1.0p-20f)) return 1; - if (test__extendhfsf2(UINT16_C(0x0001), + if (test__extendhfsf2(fromRep16(0x0001), 0x1.0p-24f)) return 1; - if (test__extendhfsf2(UINT16_C(0x8001), + if (test__extendhfsf2(fromRep16(0x8001), -0x1.0p-24f)) return 1; - if (test__extendhfsf2(UINT16_C(0x0001), + if (test__extendhfsf2(fromRep16(0x0001), 0x1.5p-25f)) return 1; // and back to zero - if (test__extendhfsf2(UINT16_C(0x0000), + if (test__extendhfsf2(fromRep16(0x0000), 0x1.0p-25f)) return 1; - if (test__extendhfsf2(UINT16_C(0x8000), + if (test__extendhfsf2(fromRep16(0x8000), -0x1.0p-25f)) return 1; // max (precise) - if (test__extendhfsf2(UINT16_C(0x7bff), + if (test__extendhfsf2(fromRep16(0x7bff), 65504.0f)) return 1; // max (rounded) - if (test__extendhfsf2(UINT16_C(0x7bff), + if (test__extendhfsf2(fromRep16(0x7bff), 65504.0f)) return 1; // max (to +inf) - if (test__extendhfsf2(UINT16_C(0x7c00), + if (test__extendhfsf2(fromRep16(0x7c00), makeInf32())) return 1; - if (test__extendhfsf2(UINT16_C(0xfc00), + if (test__extendhfsf2(fromRep16(0xfc00), -makeInf32())) return 1; return 0; Index: compiler-rt/test/builtins/Unit/extendhftf2_test.c =================================================================== --- /dev/null +++ compiler-rt/test/builtins/Unit/extendhftf2_test.c @@ -0,0 +1,97 @@ +// RUN: %clang_builtins %s %librt -o %t && %run %t +// REQUIRES: librt_has_extendhftf2 + +#include "int_lib.h" +#include + +#if __LDBL_MANT_DIG__ == 113 && defined (COMPILER_RT_HAS_FLOAT16) + +#include "fp_test.h" + +COMPILER_RT_ABI long double __extendhftf2(TYPE_FP16 a); + +int test__extendhftf2(TYPE_FP16 a, uint64_t expectedHi, uint64_t expectedLo) +{ + long double x = __extendhftf2(a); + int ret = compareResultLD(x, expectedHi, expectedLo); + + if (ret) + { + printf("error in test__extendhftf2(%#.4x) = %.20Lf, " + "expected %.20Lf\n", toRep16(a), x, + fromRep128(expectedHi, expectedLo)); + } + return ret; +} + +char assumption_1[sizeof(TYPE_FP16) * CHAR_BIT == 16] = {0}; + +#endif + +int main() +{ +#if __LDBL_MANT_DIG__ == 113 && defined (COMPILER_RT_HAS_FLOAT16) + // qNaN + if (test__extendhftf2(makeQNaN16(), + UINT64_C(0x7fff800000000000), + UINT64_C(0x0))) + return 1; + // NaN + if (test__extendhftf2(makeNaN16(UINT16_C(0x0100)), + UINT64_C(0x7fff400000000000), + UINT64_C(0x0))) + return 1; + // inf + if (test__extendhftf2(makeInf16(), + UINT64_C(0x7fff000000000000), + UINT64_C(0x0))) + return 1; + if (test__extendhftf2(-makeInf16(), + UINT64_C(0xffff000000000000), + UINT64_C(0x0))) + return 1; + // zero + if (test__extendhftf2(fromRep16(0x0U), + UINT64_C(0x0), UINT64_C(0x0))) + return 1; + if (test__extendhftf2(fromRep16(0x8000U), + UINT64_C(0x8000000000000000), + UINT64_C(0x0))) + return 1; + // denormal + if (test__extendhftf2(fromRep16(0x0010U), + UINT64_C(0x3feb000000000000), + UINT64_C(0x0000000000000000))) + return 1; + if (test__extendhftf2(fromRep16(0x0001U), + UINT64_C(0x3fe7000000000000), + UINT64_C(0x0000000000000000))) + return 1; + if (test__extendhftf2(fromRep16(0x8001U), + UINT64_C(0xbfe7000000000000), + UINT64_C(0x0000000000000000))) + return 1; + + // pi + if (test__extendhftf2(fromRep16(0x4248U), + UINT64_C(0x4000920000000000), + UINT64_C(0x0000000000000000))) + return 1; + if (test__extendhftf2(fromRep16(0xc248U), + UINT64_C(0xc000920000000000), + UINT64_C(0x0000000000000000))) + return 1; + + if (test__extendhftf2(fromRep16(0x508cU), + UINT64_C(0x4004230000000000), + UINT64_C(0x0))) + return 1; + if (test__extendhftf2(fromRep16(0x1bb7U), + UINT64_C(0x3ff6edc000000000), + UINT64_C(0x0))) + return 1; +#else + printf("skipped\n"); +#endif + return 0; +} Index: compiler-rt/test/builtins/Unit/fp_test.h =================================================================== --- compiler-rt/test/builtins/Unit/fp_test.h +++ compiler-rt/test/builtins/Unit/fp_test.h @@ -3,13 +3,25 @@ #include #include +#ifdef COMPILER_RT_HAS_FLOAT16 +#define TYPE_FP16 _Float16 +#else +#define TYPE_FP16 uint16_t +#endif + enum EXPECTED_RESULT { LESS_0, LESS_EQUAL_0, EQUAL_0, GREATER_0, GREATER_EQUAL_0, NEQUAL_0 }; -static inline uint16_t fromRep16(uint16_t x) +static inline TYPE_FP16 fromRep16(uint16_t x) { +#ifdef COMPILER_RT_HAS_FLOAT16 + TYPE_FP16 ret; + memcpy (&ret, &x, sizeof (ret)); + return ret; +#else return x; +#endif } static inline float fromRep32(uint32_t x) @@ -36,9 +48,15 @@ } #endif -static inline uint16_t toRep16(uint16_t x) +static inline uint16_t toRep16(TYPE_FP16 x) { +#ifdef COMPILER_RT_HAS_FLOAT16 + uint16_t ret; + memcpy (&ret, &x, sizeof (ret)); + return ret; +#else return x; +#endif } static inline uint32_t toRep32(float x) @@ -64,16 +82,17 @@ } #endif -static inline int compareResultH(uint16_t result, - uint16_t expected) +static inline int compareResultH(TYPE_FP16 result, + TYPE_FP16 expected) { uint16_t rep = toRep16(result); + uint16_t exp = toRep16(expected); - if (rep == expected){ + if (rep == exp){ return 0; } // test other possible NaN representation(signal NaN) - else if (expected == 0x7e00U){ + else if (exp == 0x7e00U){ if ((rep & 0x7c00U) == 0x7c00U && (rep & 0x3ffU) > 0){ return 0; @@ -199,7 +218,7 @@ return ""; } -static inline uint16_t makeQNaN16(void) +static inline TYPE_FP16 makeQNaN16(void) { return fromRep16(0x7e00U); } @@ -221,7 +240,7 @@ } #endif -static inline uint16_t makeNaN16(uint16_t rand) +static inline TYPE_FP16 makeNaN16(uint16_t rand) { return fromRep16(0x7c00U | (rand & 0x7fffU)); } @@ -243,7 +262,7 @@ } #endif -static inline uint16_t makeInf16(void) +static inline TYPE_FP16 makeInf16(void) { return fromRep16(0x7c00U); } Index: compiler-rt/test/builtins/Unit/truncdfhf2_test.c =================================================================== --- compiler-rt/test/builtins/Unit/truncdfhf2_test.c +++ compiler-rt/test/builtins/Unit/truncdfhf2_test.c @@ -5,16 +5,16 @@ #include "fp_test.h" -uint16_t __truncdfhf2(double a); +TYPE_FP16 __truncdfhf2(double a); -int test__truncdfhf2(double a, uint16_t expected) +int test__truncdfhf2(double a, TYPE_FP16 expected) { - uint16_t x = __truncdfhf2(a); + TYPE_FP16 x = __truncdfhf2(a); int ret = compareResultH(x, expected); if (ret){ - printf("error in test__truncdfhf2(%f) = %#.4x, " - "expected %#.4x\n", a, x, fromRep16(expected)); + printf("error in test__truncdfhf2(%lf) = %#.4x, " + "expected %#.4x\n", a, fromRep16(x), fromRep16(expected)); } return ret; } @@ -25,80 +25,80 @@ { // qNaN if (test__truncdfhf2(makeQNaN64(), - UINT16_C(0x7e00))) + fromRep16(0x7e00))) return 1; // NaN if (test__truncdfhf2(makeNaN64(UINT64_C(0x8000)), - UINT16_C(0x7e00))) + fromRep16(0x7e00))) return 1; // inf if (test__truncdfhf2(makeInf64(), - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncdfhf2(-makeInf64(), - UINT16_C(0xfc00))) + fromRep16(0xfc00))) return 1; // zero - if (test__truncdfhf2(0.0, UINT16_C(0x0))) + if (test__truncdfhf2(0.0, fromRep16(0x0))) return 1; - if (test__truncdfhf2(-0.0, UINT16_C(0x8000))) + if (test__truncdfhf2(-0.0, fromRep16(0x8000))) return 1; if (test__truncdfhf2(3.1415926535, - UINT16_C(0x4248))) + fromRep16(0x4248))) return 1; if (test__truncdfhf2(-3.1415926535, - UINT16_C(0xc248))) + fromRep16(0xc248))) return 1; if (test__truncdfhf2(0x1.987124876876324p+1000, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncdfhf2(0x1.987124876876324p+12, - UINT16_C(0x6e62))) + fromRep16(0x6e62))) return 1; if (test__truncdfhf2(0x1.0p+0, - UINT16_C(0x3c00))) + fromRep16(0x3c00))) return 1; if (test__truncdfhf2(0x1.0p-14, - UINT16_C(0x0400))) + fromRep16(0x0400))) return 1; // denormal if (test__truncdfhf2(0x1.0p-20, - UINT16_C(0x0010))) + fromRep16(0x0010))) return 1; if (test__truncdfhf2(0x1.0p-24, - UINT16_C(0x0001))) + fromRep16(0x0001))) return 1; if (test__truncdfhf2(-0x1.0p-24, - UINT16_C(0x8001))) + fromRep16(0x8001))) return 1; if (test__truncdfhf2(0x1.5p-25, - UINT16_C(0x0001))) + fromRep16(0x0001))) return 1; // and back to zero if (test__truncdfhf2(0x1.0p-25, - UINT16_C(0x0000))) + fromRep16(0x0000))) return 1; if (test__truncdfhf2(-0x1.0p-25, - UINT16_C(0x8000))) + fromRep16(0x8000))) return 1; // max (precise) if (test__truncdfhf2(65504.0, - UINT16_C(0x7bff))) + fromRep16(0x7bff))) return 1; // max (rounded) if (test__truncdfhf2(65519.0, - UINT16_C(0x7bff))) + fromRep16(0x7bff))) return 1; // max (to +inf) if (test__truncdfhf2(65520.0, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncdfhf2(-65520.0, - UINT16_C(0xfc00))) + fromRep16(0xfc00))) return 1; if (test__truncdfhf2(65536.0, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; return 0; } Index: compiler-rt/test/builtins/Unit/truncsfhf2_test.c =================================================================== --- compiler-rt/test/builtins/Unit/truncsfhf2_test.c +++ compiler-rt/test/builtins/Unit/truncsfhf2_test.c @@ -5,16 +5,16 @@ #include "fp_test.h" -uint16_t __truncsfhf2(float a); +TYPE_FP16 __truncsfhf2(float a); -int test__truncsfhf2(float a, uint16_t expected) +int test__truncsfhf2(float a, TYPE_FP16 expected) { - uint16_t x = __truncsfhf2(a); + TYPE_FP16 x = __truncsfhf2(a); int ret = compareResultH(x, expected); if (ret){ printf("error in test__truncsfhf2(%f) = %#.4x, " - "expected %#.4x\n", a, x, fromRep16(expected)); + "expected %#.4x\n", a, fromRep16(x), fromRep16(expected)); } return ret; } @@ -25,80 +25,80 @@ { // qNaN if (test__truncsfhf2(makeQNaN32(), - UINT16_C(0x7e00))) + fromRep16(0x7e00))) return 1; // NaN if (test__truncsfhf2(makeNaN32(UINT32_C(0x8000)), - UINT16_C(0x7e00))) + fromRep16(0x7e00))) return 1; // inf if (test__truncsfhf2(makeInf32(), - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncsfhf2(-makeInf32(), - UINT16_C(0xfc00))) + fromRep16(0xfc00))) return 1; // zero - if (test__truncsfhf2(0.0f, UINT16_C(0x0))) + if (test__truncsfhf2(0.0f, fromRep16(0x0))) return 1; - if (test__truncsfhf2(-0.0f, UINT16_C(0x8000))) + if (test__truncsfhf2(-0.0f, fromRep16(0x8000))) return 1; if (test__truncsfhf2(3.1415926535f, - UINT16_C(0x4248))) + fromRep16(0x4248))) return 1; if (test__truncsfhf2(-3.1415926535f, - UINT16_C(0xc248))) + fromRep16(0xc248))) return 1; if (test__truncsfhf2(0x1.987124876876324p+100f, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncsfhf2(0x1.987124876876324p+12f, - UINT16_C(0x6e62))) + fromRep16(0x6e62))) return 1; if (test__truncsfhf2(0x1.0p+0f, - UINT16_C(0x3c00))) + fromRep16(0x3c00))) return 1; if (test__truncsfhf2(0x1.0p-14f, - UINT16_C(0x0400))) + fromRep16(0x0400))) return 1; // denormal if (test__truncsfhf2(0x1.0p-20f, - UINT16_C(0x0010))) + fromRep16(0x0010))) return 1; if (test__truncsfhf2(0x1.0p-24f, - UINT16_C(0x0001))) + fromRep16(0x0001))) return 1; if (test__truncsfhf2(-0x1.0p-24f, - UINT16_C(0x8001))) + fromRep16(0x8001))) return 1; if (test__truncsfhf2(0x1.5p-25f, - UINT16_C(0x0001))) + fromRep16(0x0001))) return 1; // and back to zero if (test__truncsfhf2(0x1.0p-25f, - UINT16_C(0x0000))) + fromRep16(0x0000))) return 1; if (test__truncsfhf2(-0x1.0p-25f, - UINT16_C(0x8000))) + fromRep16(0x8000))) return 1; // max (precise) if (test__truncsfhf2(65504.0f, - UINT16_C(0x7bff))) + fromRep16(0x7bff))) return 1; // max (rounded) if (test__truncsfhf2(65519.0f, - UINT16_C(0x7bff))) + fromRep16(0x7bff))) return 1; // max (to +inf) if (test__truncsfhf2(65520.0f, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncsfhf2(65536.0f, - UINT16_C(0x7c00))) + fromRep16(0x7c00))) return 1; if (test__truncsfhf2(-65520.0f, - UINT16_C(0xfc00))) + fromRep16(0xfc00))) return 1; return 0; } Index: compiler-rt/test/builtins/Unit/trunctfhf2_test.c =================================================================== --- /dev/null +++ compiler-rt/test/builtins/Unit/trunctfhf2_test.c @@ -0,0 +1,127 @@ +// RUN: %clang_builtins %s %librt -o %t && %run %t +// REQUIRES: librt_has_trunctfhf2 + +#include "int_lib.h" +#include + +#if __LDBL_MANT_DIG__ == 113 && defined (COMPILER_RT_HAS_FLOAT16) + +#include "fp_test.h" + +TYPE_FP16 __trunctfhf2(long double a); + +int test__trunctfhf2(long double a, TYPE_FP16 expected) +{ + TYPE_FP16 x = __trunctfhf2(a); + int ret = compareResultH(x, expected); + + if (ret) + { + printf("error in test__trunctfhf2(%.20Lf) = %#.4x, " + "expected %#.4x\n", a, fromRep16(x), fromRep16(expected)); + } + return ret; +} + +char assumption_1[sizeof(TYPE_FP16) * CHAR_BIT == 16] = {0}; + +#endif + +int main() +{ +#if __LDBL_MANT_DIG__ == 113 && defined (COMPILER_RT_HAS_FLOAT16) + // qNaN + if (test__trunctfhf2(makeQNaN128(), + fromRep16(0x7e00))) + return 1; + // NaN + if (test__trunctfhf2(makeNaN128(UINT64_C(0x810000000000)), + fromRep16(0x7e00))) + return 1; + // inf + if (test__trunctfhf2(makeInf128(), + fromRep16(0x7c00))) + return 1; + if (test__trunctfhf2(-makeInf128(), + fromRep16(0xfc00))) + return 1; + // zero + if (test__trunctfhf2(0.0L, fromRep16(0x0))) + return 1; + if (test__trunctfhf2(-0.0L, fromRep16(0x8000))) + return 1; + + if (test__trunctfhf2(3.1415926535L, + fromRep16(0x4248))) + return 1; + if (test__trunctfhf2(-3.1415926535L, + fromRep16(0xc248))) + return 1; + if (test__trunctfhf2(0x1.987124876876324p+100L, + fromRep16(0x7c00))) + return 1; + if (test__trunctfhf2(0x1.987124876876324p+12L, + fromRep16(0x6e62))) + return 1; + if (test__trunctfhf2(0x1.0p+0L, + fromRep16(0x3c00))) + return 1; + if (test__trunctfhf2(0x1.0p-14L, + fromRep16(0x0400))) + return 1; + // denormal + if (test__trunctfhf2(0x1.0p-20L, + fromRep16(0x0010))) + return 1; + if (test__trunctfhf2(0x1.0p-24L, + fromRep16(0x0001))) + return 1; + if (test__trunctfhf2(-0x1.0p-24L, + fromRep16(0x8001))) + return 1; + if (test__trunctfhf2(0x1.5p-25L, + fromRep16(0x0001))) + return 1; + // and back to zero + if (test__trunctfhf2(0x1.0p-25L, + fromRep16(0x0000))) + return 1; + if (test__trunctfhf2(-0x1.0p-25L, + fromRep16(0x8000))) + return 1; + // max (precise) + if (test__trunctfhf2(65504.0L, + fromRep16(0x7bff))) + return 1; + // max (rounded) + if (test__trunctfhf2(65519.0L, + fromRep16(0x7bff))) + return 1; + // max (to +inf) + if (test__trunctfhf2(65520.0L, + fromRep16(0x7c00))) + return 1; + if (test__trunctfhf2(65536.0L, + fromRep16(0x7c00))) + return 1; + if (test__trunctfhf2(-65520.0L, + fromRep16(0xfc00))) + return 1; + + if (test__trunctfhf2(0x1.23a2abb4a2ddee355f36789abcdep+5L, + fromRep16(0x508f))) + return 1; + if (test__trunctfhf2(0x1.e3d3c45bd3abfd98b76a54cc321fp-9L, + fromRep16(0x1b8f))) + return 1; + if (test__trunctfhf2(0x1.234eebb5faa678f4488693abcdefp+453L, + fromRep16(0x7c00))) + return 1; + if (test__trunctfhf2(0x1.edcba9bb8c76a5a43dd21f334634p-43L, + fromRep16(0x0))) + return 1; +#else + printf("skipped\n"); +#endif + return 0; +} Index: llvm/include/llvm/IR/RuntimeLibcalls.def =================================================================== --- llvm/include/llvm/IR/RuntimeLibcalls.def +++ llvm/include/llvm/IR/RuntimeLibcalls.def @@ -286,6 +286,7 @@ HANDLE_LIBCALL(FPEXT_F80_F128, "__extendxftf2") HANDLE_LIBCALL(FPEXT_F64_F128, "__extenddftf2") HANDLE_LIBCALL(FPEXT_F32_F128, "__extendsftf2") +HANDLE_LIBCALL(FPEXT_F16_F128, "__extendhftf2") HANDLE_LIBCALL(FPEXT_F32_F64, "__extendsfdf2") HANDLE_LIBCALL(FPEXT_F16_F32, "__gnu_h2f_ieee") HANDLE_LIBCALL(FPROUND_F32_F16, "__gnu_f2h_ieee") Index: llvm/lib/CodeGen/TargetLoweringBase.cpp =================================================================== --- llvm/lib/CodeGen/TargetLoweringBase.cpp +++ llvm/lib/CodeGen/TargetLoweringBase.cpp @@ -224,6 +224,8 @@ if (OpVT == MVT::f16) { if (RetVT == MVT::f32) return FPEXT_F16_F32; + if (RetVT == MVT::f128) + return FPEXT_F16_F128; } else if (OpVT == MVT::f32) { if (RetVT == MVT::f64) return FPEXT_F32_F64; Index: llvm/lib/Target/AArch64/AArch64ISelLowering.cpp =================================================================== --- llvm/lib/Target/AArch64/AArch64ISelLowering.cpp +++ llvm/lib/Target/AArch64/AArch64ISelLowering.cpp @@ -360,8 +360,10 @@ setOperationAction(ISD::STRICT_UINT_TO_FP, MVT::i32, Custom); setOperationAction(ISD::STRICT_UINT_TO_FP, MVT::i64, Custom); setOperationAction(ISD::STRICT_UINT_TO_FP, MVT::i128, Custom); + setOperationAction(ISD::FP_ROUND, MVT::f16, Custom); setOperationAction(ISD::FP_ROUND, MVT::f32, Custom); setOperationAction(ISD::FP_ROUND, MVT::f64, Custom); + setOperationAction(ISD::STRICT_FP_ROUND, MVT::f16, Custom); setOperationAction(ISD::STRICT_FP_ROUND, MVT::f32, Custom); setOperationAction(ISD::STRICT_FP_ROUND, MVT::f64, Custom); Index: llvm/test/CodeGen/AArch64/arm64-fp128.ll =================================================================== --- llvm/test/CodeGen/AArch64/arm64-fp128.ll +++ llvm/test/CodeGen/AArch64/arm64-fp128.ll @@ -219,6 +219,7 @@ ; CHECK: ret } +@varhalf = global half 0.0, align 2 @varfloat = global float 0.0, align 4 @vardouble = global double 0.0, align 8 @@ -227,6 +228,12 @@ %val = load fp128, fp128* @lhs, align 16 + %half = fptrunc fp128 %val to half + store half %half, half* @varhalf, align 2 +; CHECK: ldr q0, [{{x[0-9]+}}, :lo12:lhs] +; CHECK: bl __trunctfhf2 +; CHECK: str h0, [{{x[0-9]+}}, :lo12:varhalf] + %float = fptrunc fp128 %val to float store float %float, float* @varfloat, align 4 ; CHECK: bl __trunctfsf2 @@ -245,6 +252,13 @@ %val = load fp128, fp128* @lhs, align 16 + %half = load half, half* @varhalf + %fromhalf = fpext half %half to fp128 + store volatile fp128 %fromhalf, fp128* @lhs, align 16 +; CHECK: ldr h0, [{{x[0-9]+}}, :lo12:varhalf] +; CHECK: bl __extendhftf2 +; CHECK: str q0, [{{x[0-9]+}}, :lo12:lhs] + %float = load float, float* @varfloat %fromfloat = fpext float %float to fp128 store volatile fp128 %fromfloat, fp128* @lhs, align 16