This is an archive of the discontinued LLVM Phabricator instance.

Wow, that has been a minute since that was discussed. I'm not 100% sure these days that I would encode this in the type system if I were doing it, but having the representation to do it is fine with me.

This revision is now accepted and ready to land.Nov 16 2020, 9:48 PM

Wow, what a coincidence! Thanks for the quick review!

I don't have commit permission yet - could someone help me submit this?

liufengdb added inline comments.Nov 17 2020, 8:42 AM

mlir/include/mlir/Dialect/Quant/QuantTypes.h
378	remove this storage type.
mlir/lib/Dialect/Quant/IR/QuantOps.cpp
29	alphabetical order?

Updating D91584: Add CalibratedQuantizedType to quant dialect

teijeong marked 2 inline comments as done.Nov 17 2020, 8:53 PM

Harbormaster completed remote builds in B79222: Diff 305968.Nov 17 2020, 9:18 PM

Closed by commit rG94e4ec6499a2: Add CalibratedQuantizedType to quant dialect (authored by Tei Jeong <taeheej@google.com>, committed by liufengdb). · Explain WhyNov 17 2020, 10:17 PM

This revision was automatically updated to reflect the committed changes.

liufengdb added a commit: rG94e4ec6499a2: Add CalibratedQuantizedType to quant dialect.

Revision Contents

Path

Size

mlir/

include/

mlir/

Dialect/

Quant/

QuantTypes.h

29 lines

lib/

Dialect/

Quant/

IR/

2 lines

29 lines

50 lines

65 lines

test/

Dialect/

Quant/

parse-calibrated-invalid.mlir

28 lines

parse-calibrated.mlir

10 lines

Diff 305981

mlir/include/mlir/Dialect/Quant/QuantTypes.h

Show All 22 Lines
class QuantizedIntegerType;		class QuantizedIntegerType;

namespace detail {		namespace detail {

struct QuantizedTypeStorage;		struct QuantizedTypeStorage;
struct AnyQuantizedTypeStorage;		struct AnyQuantizedTypeStorage;
struct UniformQuantizedTypeStorage;		struct UniformQuantizedTypeStorage;
struct UniformQuantizedPerAxisTypeStorage;		struct UniformQuantizedPerAxisTypeStorage;
		struct CalibratedQuantizedTypeStorage;

} // namespace detail		} // namespace detail

/// Enumeration of bit-mapped flags related to quantized types.		/// Enumeration of bit-mapped flags related to quantized types.
namespace QuantizationFlags {		namespace QuantizationFlags {
enum FlagValue {		enum FlagValue {
// Indicates that the storage type should be interpreted as a signed		// Indicates that the storage type should be interpreted as a signed
// integer. The default is to interpret it as an unsigned value.		// integer. The default is to interpret it as an unsigned value.
▲ Show 20 Lines • Show All 327 Lines • ▼ Show 20 Lines	public:
bool isFixedPoint() const {		bool isFixedPoint() const {
if (!isSigned())		if (!isSigned())
return false;		return false;
return llvm::all_of(getZeroPoints(),		return llvm::all_of(getZeroPoints(),
[](int64_t zeroPoint) { return zeroPoint != 0; });		[](int64_t zeroPoint) { return zeroPoint != 0; });
}		}
};		};

		/// A quantized type that infers its range from given min/max values.
		///
		/// Typical syntax:
		/// quant.calibrated<f32<-0.922:0.981>>
		liufengdbUnsubmitted Done Reply Inline Actions remove this storage type. liufengdb: remove this storage type.
		class CalibratedQuantizedType
		: public Type::TypeBase<CalibratedQuantizedType, QuantizedType,
		detail::CalibratedQuantizedTypeStorage> {
		public:
		using Base::Base;

		/// Gets an instance of the type with all parameters specified but not
		/// checked.
		static CalibratedQuantizedType get(Type expressedType, double min,
		double max);

		/// Gets an instance of the type with all specified parameters checked.
		/// Returns a nullptr convertible type on failure.
		static CalibratedQuantizedType getChecked(Type expressedType, double min,
		double max, Location location);

		/// Verifies construction invariants and issues errors/warnings.
		/// Fails unless `expressedType` is a floating point type and `min` is
		/// strictly less than `max`.
		static LogicalResult verifyConstructionInvariants(Location loc,
		Type expressedType,
		double min, double max);

		/// Returns the lower bound of the calibrated range.
		double getMin() const;

		/// Returns the upper bound of the calibrated range.
		double getMax() const;
		};

} // namespace quant		} // namespace quant
} // namespace mlir		} // namespace mlir

#endif // MLIR_DIALECT_QUANT_QUANT_TYPES_H_		#endif // MLIR_DIALECT_QUANT_QUANT_TYPES_H_

mlir/lib/Dialect/Quant/IR/QuantOps.cpp

	Show All 18 Lines
	#include "llvm/Support/MathExtras.h"			#include "llvm/Support/MathExtras.h"
	#include <numeric>			#include <numeric>

	using namespace mlir;			using namespace mlir;
	using namespace mlir::quant;			using namespace mlir::quant;
	using namespace mlir::quant::detail;			using namespace mlir::quant::detail;

	void QuantizationDialect::initialize() {			void QuantizationDialect::initialize() {
	addTypes<AnyQuantizedType, UniformQuantizedType,			addTypes<AnyQuantizedType, CalibratedQuantizedType, UniformQuantizedType,
	UniformQuantizedPerAxisType>();			UniformQuantizedPerAxisType>();
	addOperations<			addOperations<
				liufengdbUnsubmitted Done Reply Inline Actions alphabetical order? liufengdb: alphabetical order?
	#define GET_OP_LIST			#define GET_OP_LIST
	#include "mlir/Dialect/Quant/QuantOps.cpp.inc"			#include "mlir/Dialect/Quant/QuantOps.cpp.inc"
	>();			>();
	}			}

	OpFoldResult StorageCastOp::fold(ArrayRef<Attribute> operands) {			OpFoldResult StorageCastOp::fold(ArrayRef<Attribute> operands) {
	// Matches x -> [scast -> scast] -> y, replacing the second scast with the			// Matches x -> [scast -> scast] -> y, replacing the second scast with the
	// value of x if the casts invert each other.			// value of x if the casts invert each other.
	▲ Show 20 Lines • Show All 58 Lines • Show Last 20 Lines

mlir/lib/Dialect/Quant/IR/QuantTypes.cpp

	Show First 20 Lines • Show All 348 Lines • ▼ Show 20 Lines

	ArrayRef<int64_t> UniformQuantizedPerAxisType::getZeroPoints() const {			ArrayRef<int64_t> UniformQuantizedPerAxisType::getZeroPoints() const {
	return getImpl()->getZeroPoints();			return getImpl()->getZeroPoints();
	}			}

	int32_t UniformQuantizedPerAxisType::getQuantizedDimension() const {			int32_t UniformQuantizedPerAxisType::getQuantizedDimension() const {
	return getImpl()->quantizedDimension;			return getImpl()->quantizedDimension;
	}			}

				/// Returns the CalibratedQuantizedType for `expressedType` with the range
				/// [`min`, `max`]. The context is taken from `expressedType`; the
				/// parameters are forwarded to Base::get as-is.
				CalibratedQuantizedType CalibratedQuantizedType::get(Type expressedType,
				double min, double max) {
				return Base::get(expressedType.getContext(), expressedType, min, max);
				}

				/// Checked counterpart of `get`: forwards `expressedType`, `min` and `max`
				/// to Base::getChecked together with `location`, which is where any
				/// diagnostics are reported.
				CalibratedQuantizedType CalibratedQuantizedType::getChecked(Type expressedType,
				double min,
				double max,
				Location location) {
				return Base::getChecked(location, expressedType, min, max);
				}

				/// Checks the parameters of a CalibratedQuantizedType and reports the first
				/// violation at `loc`:
				///   * `expressedType` has to be a floating point type;
				///   * the range must be non-empty, i.e. `min` strictly below `max`.
				/// Returns success when both conditions hold.
				LogicalResult CalibratedQuantizedType::verifyConstructionInvariants(
				    Location loc, Type expressedType, double min, double max) {
				  // Only floating point expressed types are supported. Lifting this
				  // restriction also requires extending the parser/printer.
				  const bool hasFloatExpressedType = expressedType.isa<FloatType>();
				  if (!hasFloatExpressedType) {
				    return emitError(loc, "expressed type must be floating point");
				  }

				  // Reject empty (min == max) and inverted (min > max) ranges.
				  const bool hasEmptyOrInvertedRange = max <= min;
				  if (hasEmptyOrInvertedRange) {
				    return emitError(loc, "illegal min and max: (")
				           << min << ":" << max << ")";
				  }

				  return success();
				}

				/// Returns the `min` value held by this type's storage.
				double CalibratedQuantizedType::getMin() const { return getImpl()->min; }

				/// Returns the `max` value held by this type's storage.
				double CalibratedQuantizedType::getMax() const { return getImpl()->max; }

mlir/lib/Dialect/Quant/IR/TypeDetail.h

Show First 20 Lines • Show All 247 Lines • ▼ Show 20 Lines	struct UniformQuantizedPerAxisTypeStorage : public QuantizedTypeStorage {
}		}

const double *scaleElements;		const double *scaleElements;
const int64_t *zeroPointElements;		const int64_t *zeroPointElements;
unsigned quantParamsSize;		unsigned quantParamsSize;
int32_t quantizedDimension;		int32_t quantizedDimension;
};		};

		/// Storage for CalibratedQuantizedType: the expressed floating point type
		/// plus the calibrated [min, max] range. The base QuantizedTypeStorage is
		/// initialized with zero flags, a null storage type and a zero storage
		/// range, since a calibrated type carries no storage-type information.
		struct CalibratedQuantizedTypeStorage : public QuantizedTypeStorage {
		  /// Key identifying one calibrated type instance.
		  struct KeyTy {
		    KeyTy(Type expressedType, double min, double max)
		        : expressedType(expressedType), min(min), max(max) {}
		    // Floating point type that the quantized type approximates.
		    Type expressedType;

		    // Calibrated range bounds.
		    double min;
		    double max;

		    // Check for equality of two structures that share KeyTy data members
		    // (by name).
		    template <typename T, typename U>
		    static bool genericIsEqual(const T &lhs, const U &rhs) {
		      return lhs.expressedType == rhs.expressedType && lhs.min == rhs.min &&
		             lhs.max == rhs.max;
		    }

		    bool operator==(const KeyTy &other) const {
		      return genericIsEqual(*this, other);
		    }

		    /// Returns the bit pattern of `value` for hashing. -0.0 is folded into
		    /// +0.0 first: the two compare equal in genericIsEqual, so they must
		    /// also hash equal.
		    static int64_t getHashBits(double value) {
		      return llvm::bit_cast<int64_t>(value == 0.0 ? 0.0 : value);
		    }

		    /// Hashes the expressed type together with the full bit patterns of
		    /// `min` and `max`. Reinterpreting the bits (rather than converting the
		    /// doubles to integers) keeps the fractional part in the hash and is
		    /// well defined for every double, including NaN and infinities.
		    unsigned getHashValue() const {
		      int64_t minBits = getHashBits(min);
		      int64_t maxBits = getHashBits(max);
		      return llvm::hash_combine(expressedType, minBits, maxBits);
		    }
		  };

		  CalibratedQuantizedTypeStorage(const KeyTy &key)
		      : QuantizedTypeStorage(0, NoneType(), key.expressedType, 0, 0),
		        min(key.min), max(key.max) {}

		  /// Compares this storage against a key, member by member.
		  bool operator==(const KeyTy &key) const {
		    return KeyTy::genericIsEqual(*this, key);
		  }

		  /// Construction.
		  static CalibratedQuantizedTypeStorage *
		  construct(TypeStorageAllocator &allocator, const KeyTy &key) {
		    return new (allocator.allocate<CalibratedQuantizedTypeStorage>())
		        CalibratedQuantizedTypeStorage(key);
		  }

		  static unsigned hashKey(const KeyTy &key) { return key.getHashValue(); }

		  // Calibrated range bounds, copied from the key.
		  double min;
		  double max;
		};

} // namespace detail		} // namespace detail
} // namespace quant		} // namespace quant
} // namespace mlir		} // namespace mlir

#endif // TYPE_DETAIL_H_		#endif // TYPE_DETAIL_H_

mlir/lib/Dialect/Quant/IR/TypeParser.cpp

Show First 20 Lines • Show All 85 Lines • ▼ Show 20 Lines	static ParseResult parseStorageRange(DialectAsmParser &parser,
}		}
if (storageTypeMax > defaultIntegerMax) {		if (storageTypeMax > defaultIntegerMax) {
return parser.emitError(maxLoc, "illegal storage type maximum: ")		return parser.emitError(maxLoc, "illegal storage type maximum: ")
<< storageTypeMax;		<< storageTypeMax;
}		}
return success();		return success();
}		}

/// Parses a UniformQuantizedType.		static FloatType parseExpressedTypeAndRange(DialectAsmParser &parser,
		double &min, double &max) {
		auto typeLoc = parser.getCurrentLocation();
		FloatType type;

		if (failed(parser.parseType(type))) {
		parser.emitError(typeLoc, "expecting float expressed type");
		return nullptr;
		}

		// Calibrated min and max values.
		if (parser.parseLess() || parser.parseFloat(min) || parser.parseColon() ||
		parser.parseFloat(max) || parser.parseGreater()) {
		parser.emitError(typeLoc, "calibrated values must be present");
		return nullptr;
		}
		return type;
		}

		/// Parses an AnyQuantizedType.
///		///
/// uniform_per_layer ::= `any<` storage-spec (expressed-type-spec)?`>`		/// any ::= `any<` storage-spec (expressed-type-spec)?`>`
/// storage-spec ::= storage-type (`<` storage-range `>`)?		/// storage-spec ::= storage-type (`<` storage-range `>`)?
/// storage-range ::= integer-literal `:` integer-literal		/// storage-range ::= integer-literal `:` integer-literal
/// storage-type ::= (`i` | `u`) integer-literal		/// storage-type ::= (`i` | `u`) integer-literal
/// expressed-type-spec ::= `:` `f` integer-literal		/// expressed-type-spec ::= `:` `f` integer-literal
static Type parseAnyType(DialectAsmParser &parser, Location loc) {		static Type parseAnyType(DialectAsmParser &parser, Location loc) {
IntegerType storageType;		IntegerType storageType;
FloatType expressedType;		FloatType expressedType;
unsigned typeFlags = 0;		unsigned typeFlags = 0;
▲ Show 20 Lines • Show All 159 Lines • ▼ Show 20 Lines	return UniformQuantizedPerAxisType::getChecked(
quantizedDimension, storageTypeMin, storageTypeMax, loc);		quantizedDimension, storageTypeMin, storageTypeMax, loc);
}		}

return UniformQuantizedType::getChecked(typeFlags, storageType, expressedType,		return UniformQuantizedType::getChecked(typeFlags, storageType, expressedType,
scales.front(), zeroPoints.front(),		scales.front(), zeroPoints.front(),
storageTypeMin, storageTypeMax, loc);		storageTypeMin, storageTypeMax, loc);
}		}

		/// Parses a CalibratedQuantizedType.
		///
		///   calibrated ::= `calibrated<` expressed-spec `>`
		///   expressed-spec ::= expressed-type `<` calibrated-range `>`
		///   expressed-type ::= `f` integer-literal
		///   calibrated-range ::= float-literal `:` float-literal
		///
		/// Returns a null type if any part of the syntax fails to parse; the final
		/// type is built through the checked constructor using `loc`.
		static Type parseCalibratedType(DialectAsmParser &parser, Location loc) {
		  // Opening `<` of the type specification.
		  if (parser.parseLess())
		    return nullptr;

		  // Expressed type followed by its calibrated range.
		  double rangeMin;
		  double rangeMax;
		  FloatType floatType = parseExpressedTypeAndRange(parser, rangeMin, rangeMax);

		  // The closing `>` is only looked for once the expressed spec parsed.
		  if (!floatType || parser.parseGreater())
		    return nullptr;

		  return CalibratedQuantizedType::getChecked(floatType, rangeMin, rangeMax,
		                                             loc);
		}

/// Parse a type registered to this dialect.		/// Parse a type registered to this dialect.
Type QuantizationDialect::parseType(DialectAsmParser &parser) const {		Type QuantizationDialect::parseType(DialectAsmParser &parser) const {
Location loc = parser.getEncodedSourceLoc(parser.getNameLoc());		Location loc = parser.getEncodedSourceLoc(parser.getNameLoc());

// All types start with an identifier that we switch on.		// All types start with an identifier that we switch on.
StringRef typeNameSpelling;		StringRef typeNameSpelling;
if (failed(parser.parseKeyword(&typeNameSpelling)))		if (failed(parser.parseKeyword(&typeNameSpelling)))
return nullptr;		return nullptr;

if (typeNameSpelling == "uniform")		if (typeNameSpelling == "uniform")
return parseUniformType(parser, loc);		return parseUniformType(parser, loc);
if (typeNameSpelling == "any")		if (typeNameSpelling == "any")
return parseAnyType(parser, loc);		return parseAnyType(parser, loc);
		if (typeNameSpelling == "calibrated")
		return parseCalibratedType(parser, loc);

parser.emitError(parser.getNameLoc(),		parser.emitError(parser.getNameLoc(),
"unknown quantized type " + typeNameSpelling);		"unknown quantized type " + typeNameSpelling);
return nullptr;		return nullptr;
}		}

static void printStorageType(QuantizedType type, DialectAsmPrinter &out) {		static void printStorageType(QuantizedType type, DialectAsmPrinter &out) {
// storage type		// storage type
Show All 20 Lines
static void printQuantParams(double scale, int64_t zeroPoint,		static void printQuantParams(double scale, int64_t zeroPoint,
DialectAsmPrinter &out) {		DialectAsmPrinter &out) {
out << scale;		out << scale;
if (zeroPoint != 0) {		if (zeroPoint != 0) {
out << ":" << zeroPoint;		out << ":" << zeroPoint;
}		}
}		}

/// Helper that prints a UniformQuantizedType.		/// Helper that prints an AnyQuantizedType.
static void printAnyQuantizedType(AnyQuantizedType type,		static void printAnyQuantizedType(AnyQuantizedType type,
DialectAsmPrinter &out) {		DialectAsmPrinter &out) {
out << "any<";		out << "any<";
printStorageType(type, out);		printStorageType(type, out);
if (Type expressedType = type.getExpressedType()) {		if (Type expressedType = type.getExpressedType()) {
out << ":" << expressedType;		out << ":" << expressedType;
}		}
out << ">";		out << ">";
Show All 28 Lines	llvm::interleave(
llvm::seq<size_t>(0, scales.size()), out,		llvm::seq<size_t>(0, scales.size()), out,
[&](size_t index) {		[&](size_t index) {
printQuantParams(scales[index], zeroPoints[index], out);		printQuantParams(scales[index], zeroPoints[index], out);
},		},
",");		",");
out << "}>";		out << "}>";
}		}

		/// Helper that prints a CalibratedQuantizedType.
		///
		/// Emits `calibrated<` expressed-type `<` min `:` max `>>`. The range uses
		/// `:` as separator because that is what the calibrated-range grammar
		/// (float-literal `:` float-literal) accepts when parsing; printing any
		/// other separator produces text that cannot be parsed back.
		/// NOTE: FileCheck expectations written against the former ", " separator
		/// must be updated to ":" together with this change.
		static void printCalibratedQuantizedType(CalibratedQuantizedType type,
		                                         DialectAsmPrinter &out) {
		  out << "calibrated<" << type.getExpressedType();
		  out << "<" << type.getMin() << ":" << type.getMax() << ">";
		  out << ">";
		}

/// Print a type registered to this dialect.		/// Print a type registered to this dialect.
void QuantizationDialect::printType(Type type, DialectAsmPrinter &os) const {		void QuantizationDialect::printType(Type type, DialectAsmPrinter &os) const {
if (auto anyType = type.dyn_cast<AnyQuantizedType>())		if (auto anyType = type.dyn_cast<AnyQuantizedType>())
printAnyQuantizedType(anyType, os);		printAnyQuantizedType(anyType, os);
else if (auto uniformType = type.dyn_cast<UniformQuantizedType>())		else if (auto uniformType = type.dyn_cast<UniformQuantizedType>())
printUniformQuantizedType(uniformType, os);		printUniformQuantizedType(uniformType, os);
else if (auto perAxisType = type.dyn_cast<UniformQuantizedPerAxisType>())		else if (auto perAxisType = type.dyn_cast<UniformQuantizedPerAxisType>())
printUniformQuantizedPerAxisType(perAxisType, os);		printUniformQuantizedPerAxisType(perAxisType, os);
		else if (auto calibratedType = type.dyn_cast<CalibratedQuantizedType>())
		printCalibratedQuantizedType(calibratedType, os);
else		else
llvm_unreachable("Unhandled quantized type");		llvm_unreachable("Unhandled quantized type");
}		}

mlir/test/Dialect/Quant/parse-calibrated-invalid.mlir

This file was added.

				// RUN: mlir-opt %s -split-input-file -verify-diagnostics

				// -----
				// Unrecognized token: missing calibrated type maximum
				// expected-error@+2 {{calibrated values must be present}}
				// expected-error@+1 {{expected ':'}}
				!qalias = type !quant.calibrated<f32<-0.998>>

				// -----
				// Unrecognized token: missing closing angle bracket
				// expected-error@+1 {{expected '>'}}
				!qalias = type !quant<"calibrated<f32<-0.998:1.232>">

				// -----
				// Unrecognized expressed type: integer type
				// expected-error@+2 {{invalid kind of type specified}}
				// expected-error@+1 {{expecting float expressed type}}
				!qalias = type !quant.calibrated<i8<-4:3>>

				// -----
				// Illegal storage min/max: max - min < 0
				// expected-error@+1 {{illegal min and max: (1.000000e+00:-1.000000e+00)}}
				!qalias = type !quant.calibrated<f32<1.0:-1.0>>

				// -----
				// Illegal storage min/max: max - min == 0
				// expected-error@+1 {{illegal min and max: (1.000000e+00:1.000000e+00)}}
				!qalias = type !quant.calibrated<f32<1.0:1.0>>

mlir/test/Dialect/Quant/parse-calibrated.mlir

This file was added.

				// RUN: mlir-opt -allow-unregistered-dialect %s -split-input-file | FileCheck %s

				// -----
				// CHECK-LABEL: parseCalibrated
				// CHECK: !quant.calibrated<f32<-0.998, 1.232100e+00>
				!qalias = type !quant.calibrated<f32<-0.998:1.2321>>
				func @parseCalibrated() -> !qalias {
				%0 = "foo"() : () -> !qalias
				return %0 : !qalias
				}

This is an archive of the discontinued LLVM Phabricator instance.

Add CalibratedQuantizedType to quant dialectClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 305981

mlir/include/mlir/Dialect/Quant/QuantTypes.h

mlir/lib/Dialect/Quant/IR/QuantOps.cpp

mlir/lib/Dialect/Quant/IR/QuantTypes.cpp

mlir/lib/Dialect/Quant/IR/TypeDetail.h

mlir/lib/Dialect/Quant/IR/TypeParser.cpp

mlir/test/Dialect/Quant/parse-calibrated-invalid.mlir

mlir/test/Dialect/Quant/parse-calibrated.mlir

Add CalibratedQuantizedType to quant dialect
ClosedPublic