diff --git a/llvm/include/llvm/ADT/APFixedPoint.h b/llvm/include/llvm/ADT/APFixedPoint.h --- a/llvm/include/llvm/ADT/APFixedPoint.h +++ b/llvm/include/llvm/ADT/APFixedPoint.h @@ -1,4 +1,4 @@ -//===- APFixedPoint.h - Fixed point constant handling -----------*- C++ -*-===// +//===- FixedPoint.h - Fixed point constant handling -------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. @@ -16,6 +16,7 @@ #ifndef LLVM_ADT_APFIXEDPOINT_H #define LLVM_ADT_APFIXEDPOINT_H +#include "llvm/ADT/APFloat.h" #include "llvm/ADT/APSInt.h" #include "llvm/ADT/SmallString.h" #include "llvm/Support/raw_ostream.h" @@ -159,6 +160,8 @@ APSInt convertToInt(unsigned DstWidth, bool DstSign, bool *Overflow = nullptr) const; + APFloat convertToFloat(const fltSemantics &FloatSema) const; + void toString(SmallVectorImpl &Str) const; std::string toString() const { SmallString<40> S; @@ -194,6 +197,9 @@ const FixedPointSemantics &DstFXSema, bool *Overflow = nullptr); + static APFixedPoint getFromFloatValue(const APFloat &Value, + const FixedPointSemantics &DstFXSema, + bool *Overflow = nullptr); private: APSInt Val; FixedPointSemantics Sema; diff --git a/llvm/lib/Support/APFixedPoint.cpp b/llvm/lib/Support/APFixedPoint.cpp --- a/llvm/lib/Support/APFixedPoint.cpp +++ b/llvm/lib/Support/APFixedPoint.cpp @@ -417,6 +417,34 @@ return Result.extOrTrunc(DstWidth); } +APFloat +APFixedPoint::convertToFloat(const fltSemantics &FloatSema) const { + // For some operations, rounding mode has an effect on the result, while + // other operations are lossless and should never result in rounding. + // To signify which these operations are, we define two rounding modes here. + APFloat::roundingMode RM = APFloat::rmNearestTiesToEven; + APFloat::roundingMode LosslessRM = APFloat::rmTowardZero; + + // Convert the fixed point value bits as an integer. If the floating point + // value does not have the required precision, we will round according to the + // given mode. + APFloat Flt(FloatSema); + APFloat::opStatus S = Flt.convertFromAPInt(Val, Sema.isSigned(), RM); + + // If we cared about checking for precision loss, we could look at this + // status. + (void)S; + + // Scale down the integer value in the float to match the correct scaling + // factor. + APFloat ScaleFactor(std::pow(2, -(int)Sema.getScale())); + bool Ignored; + ScaleFactor.convert(FloatSema, LosslessRM, &Ignored); + Flt.multiply(ScaleFactor, LosslessRM); + + return Flt; +} + APFixedPoint APFixedPoint::getFromIntValue(const APSInt &Value, const FixedPointSemantics &DstFXSema, bool *Overflow) { @@ -425,4 +453,62 @@ return APFixedPoint(Value, IntFXSema).convert(DstFXSema, Overflow); } +APFixedPoint +APFixedPoint::getFromFloatValue(const APFloat &Value, + const FixedPointSemantics &DstFXSema, + bool *Overflow) { + // For some operations, rounding mode has an effect on the result, while + // other operations are lossless and should never result in rounding. + // To signify which these operations are, we define two rounding modes here, + // even though they are the same mode. + APFloat::roundingMode RM = APFloat::rmTowardZero; + APFloat::roundingMode LosslessRM = APFloat::rmTowardZero; + + const fltSemantics &FloatSema = Value.getSemantics(); + + APFloat Val = Value; + + // Scale up the float so that the 'fractional' part of the mantissa ends up in + // the integer range instead. Rounding mode is irrelevant here. + // It is fine if this overflows to infinity even for saturating types, + // since we will use floating point comparisons to check for saturation. + APFloat ScaleFactor(std::pow(2, DstFXSema.getScale())); + bool Ignored; + ScaleFactor.convert(FloatSema, LosslessRM, &Ignored); + Val.multiply(ScaleFactor, LosslessRM); + + // Convert to the integral representation of the value. This rounding mode + // is significant. + APSInt Res(DstFXSema.getWidth(), !DstFXSema.isSigned()); + Val.convertToInteger(Res, RM, &Ignored); + + // Round the integral value and scale back. This makes the + // overflow calculations below work properly. If we do not round here, + // we risk checking for overflow with a value that is outside the + // representable range of the fixed-point semantic even though no overflow + // would occur had we rounded first. + ScaleFactor = APFloat(std::pow(2, -(int)DstFXSema.getScale())); + ScaleFactor.convert(FloatSema, LosslessRM, &Ignored); + Val.roundToIntegral(RM); + Val.multiply(ScaleFactor, LosslessRM); + + // Check for overflow/saturation by checking if the floating point value + // is outside the range representable by the fixed-point value. + APFloat FloatMax = getMax(DstFXSema).convertToFloat(FloatSema); + APFloat FloatMin = getMin(DstFXSema).convertToFloat(FloatSema); + bool Overflowed = false; + if (DstFXSema.isSaturated()) { + if (Val > FloatMax) + Res = getMax(DstFXSema).getValue(); + else if (Val < FloatMin) + Res = getMin(DstFXSema).getValue(); + } else + Overflowed = Val > FloatMax || Val < FloatMin; + + if (Overflow) + *Overflow = Overflowed; + + return APFixedPoint(Res, DstFXSema); +} + } // namespace clang diff --git a/llvm/unittests/ADT/APFixedPointTest.cpp b/llvm/unittests/ADT/APFixedPointTest.cpp --- a/llvm/unittests/ADT/APFixedPointTest.cpp +++ b/llvm/unittests/ADT/APFixedPointTest.cpp @@ -7,6 +7,7 @@ //===----------------------------------------------------------------------===// #include "llvm/ADT/APFixedPoint.h" +#include "llvm/ADT/APFloat.h" #include "llvm/ADT/APSInt.h" #include "gtest/gtest.h" @@ -641,4 +642,162 @@ 4294967295ULL << 32); } +enum OvfKind { + MinSat, + MaxSat +}; + +void CheckFloatToFixedConversion(APFloat &Val, const FixedPointSemantics &Sema, + int64_t ExpectedNonSat) { + bool Ovf; + ASSERT_EQ(APFixedPoint::getFromFloatValue(Val, Sema, &Ovf) + .getValue(), ExpectedNonSat); + ASSERT_EQ(Ovf, false); + ASSERT_EQ(APFixedPoint::getFromFloatValue(Val, Saturated(Sema), &Ovf) + .getValue(), ExpectedNonSat); + ASSERT_EQ(Ovf, false); +} + +void CheckFloatToFixedConversion(APFloat &Val, const FixedPointSemantics &Sema, + OvfKind ExpectedOvf) { + bool Ovf; + (void)APFixedPoint::getFromFloatValue(Val, Sema, &Ovf); + ASSERT_EQ(Ovf, true); + ASSERT_EQ(APFixedPoint::getFromFloatValue(Val, Saturated(Sema), &Ovf) + .getValue(), + (ExpectedOvf == MinSat ? APFixedPoint::getMin(Sema) + : APFixedPoint::getMax(Sema)).getValue()); + ASSERT_EQ(Ovf, false); +} + +TEST(FixedPoint, FloatToFixed) { + APFloat Val(0.0f); + + // Simple exact fraction + Val = APFloat(0.75f); + CheckFloatToFixedConversion(Val, getSAccumSema(), 3ULL << 5); + CheckFloatToFixedConversion(Val, getAccumSema(), 3ULL << 13); + CheckFloatToFixedConversion(Val, getLAccumSema(), 3ULL << 29); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), 3ULL << 6); + CheckFloatToFixedConversion(Val, getUAccumSema(), 3ULL << 14); + CheckFloatToFixedConversion(Val, getULAccumSema(), 3ULL << 30); + + CheckFloatToFixedConversion(Val, getSFractSema(), 3ULL << 5); + CheckFloatToFixedConversion(Val, getFractSema(), 3ULL << 13); + CheckFloatToFixedConversion(Val, getLFractSema(), 3ULL << 29); + + CheckFloatToFixedConversion(Val, getUSFractSema(), 3ULL << 6); + CheckFloatToFixedConversion(Val, getUFractSema(), 3ULL << 14); + CheckFloatToFixedConversion(Val, getULFractSema(), 3ULL << 30); + + // Simple negative exact fraction + Val = APFloat(-0.75f); + CheckFloatToFixedConversion(Val, getSAccumSema(), -3ULL << 5); + CheckFloatToFixedConversion(Val, getAccumSema(), -3ULL << 13); + CheckFloatToFixedConversion(Val, getLAccumSema(), -3ULL << 29); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), MinSat); + CheckFloatToFixedConversion(Val, getUAccumSema(), MinSat); + CheckFloatToFixedConversion(Val, getULAccumSema(), MinSat); + + CheckFloatToFixedConversion(Val, getSFractSema(), -3ULL << 5); + CheckFloatToFixedConversion(Val, getFractSema(), -3ULL << 13); + CheckFloatToFixedConversion(Val, getLFractSema(), -3ULL << 29); + + CheckFloatToFixedConversion(Val, getUSFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getUFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getULFractSema(), MinSat); + + // Highly precise fraction + Val = APFloat(0.999999940395355224609375f); + CheckFloatToFixedConversion(Val, getSAccumSema(), 0x7FULL); + CheckFloatToFixedConversion(Val, getAccumSema(), 0x7FFFULL); + CheckFloatToFixedConversion(Val, getLAccumSema(), 0xFFFFFFULL << 7); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), 0xFFULL); + CheckFloatToFixedConversion(Val, getUAccumSema(), 0xFFFFULL); + CheckFloatToFixedConversion(Val, getULAccumSema(), 0xFFFFFFULL << 8); + + CheckFloatToFixedConversion(Val, getSFractSema(), 0x7FULL); + CheckFloatToFixedConversion(Val, getFractSema(), 0x7FFFULL); + CheckFloatToFixedConversion(Val, getLFractSema(), 0xFFFFFFULL << 7); + + CheckFloatToFixedConversion(Val, getUSFractSema(), 0xFFULL); + CheckFloatToFixedConversion(Val, getUFractSema(), 0xFFFFULL); + CheckFloatToFixedConversion(Val, getULFractSema(), 0xFFFFFFULL << 8); + + // Integral and fraction + Val = APFloat(17.99609375f); + CheckFloatToFixedConversion(Val, getSAccumSema(), 0x11FFULL >> 1); + CheckFloatToFixedConversion(Val, getAccumSema(), 0x11FFULL << 7); + CheckFloatToFixedConversion(Val, getLAccumSema(), 0x11FFULL << 23); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), 0x11FFULL); + CheckFloatToFixedConversion(Val, getUAccumSema(), 0x11FFULL << 8); + CheckFloatToFixedConversion(Val, getULAccumSema(), 0x11FFULL << 24); + + CheckFloatToFixedConversion(Val, getSFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getLFractSema(), MaxSat); + + CheckFloatToFixedConversion(Val, getUSFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getUFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getULFractSema(), MaxSat); + + // Negative integral and fraction + Val = APFloat(-17.99609375f); + CheckFloatToFixedConversion(Val, getSAccumSema(), -0x11FELL >> 1); + CheckFloatToFixedConversion(Val, getAccumSema(), -0x11FFULL << 7); + CheckFloatToFixedConversion(Val, getLAccumSema(), -0x11FFULL << 23); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), MinSat); + CheckFloatToFixedConversion(Val, getUAccumSema(), MinSat); + CheckFloatToFixedConversion(Val, getULAccumSema(), MinSat); + + CheckFloatToFixedConversion(Val, getSFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getLFractSema(), MinSat); + + CheckFloatToFixedConversion(Val, getUSFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getUFractSema(), MinSat); + CheckFloatToFixedConversion(Val, getULFractSema(), MinSat); + + // Very large value + Val = APFloat(1.0e38f); + CheckFloatToFixedConversion(Val, getSAccumSema(), MaxSat); + CheckFloatToFixedConversion(Val, getAccumSema(), MaxSat); + CheckFloatToFixedConversion(Val, getLAccumSema(), MaxSat); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), MaxSat); + CheckFloatToFixedConversion(Val, getUAccumSema(), MaxSat); + CheckFloatToFixedConversion(Val, getULAccumSema(), MaxSat); + + CheckFloatToFixedConversion(Val, getSFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getLFractSema(), MaxSat); + + CheckFloatToFixedConversion(Val, getUSFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getUFractSema(), MaxSat); + CheckFloatToFixedConversion(Val, getULFractSema(), MaxSat); + + // Very small value + Val = APFloat(1.0e-38f); + CheckFloatToFixedConversion(Val, getSAccumSema(), 0); + CheckFloatToFixedConversion(Val, getAccumSema(), 0); + CheckFloatToFixedConversion(Val, getLAccumSema(), 0); + + CheckFloatToFixedConversion(Val, getUSAccumSema(), 0); + CheckFloatToFixedConversion(Val, getUAccumSema(), 0); + CheckFloatToFixedConversion(Val, getULAccumSema(), 0); + + CheckFloatToFixedConversion(Val, getSFractSema(), 0); + CheckFloatToFixedConversion(Val, getFractSema(), 0); + CheckFloatToFixedConversion(Val, getLFractSema(), 0); + + CheckFloatToFixedConversion(Val, getUSFractSema(), 0); + CheckFloatToFixedConversion(Val, getUFractSema(), 0); + CheckFloatToFixedConversion(Val, getULFractSema(), 0); +} + } // namespace