Diff 379228

mlir/include/mlir/Dialect/Linalg/Transforms/ComprehensiveBufferize.h

Show First 20 Lines • Show All 78 Lines • ▼ Show 20 Lines	public:
/// be visible from R).		/// be visible from R).
/// 2. one cannot find an intermediate clobbering write `C` to W, such that		/// 2. one cannot find an intermediate clobbering write `C` to W, such that
/// C interleaved between W and R (i.e. W -> C -> R where -> denotes		/// C interleaved between W and R (i.e. W -> C -> R where -> denotes
/// dominance).		/// dominance).
bool wouldCreateReadAfterWriteInterference(		bool wouldCreateReadAfterWriteInterference(
Operation *opToBufferize, DenseSet<OpOperand *> &usesRead,		Operation *opToBufferize, DenseSet<OpOperand *> &usesRead,
DenseSet<OpOperand *> &usesWrite, const DominanceInfo &domInfo) const;		DenseSet<OpOperand *> &usesWrite, const DominanceInfo &domInfo) const;

/// Return true if bufferizing `opResult` inplace would create a write to a		/// Return true if bufferizing `opOperand` inplace with `opResult` would
/// non-writable buffer.		/// create a write to a non-writable buffer.
bool wouldCreateWriteToNonWritableBuffer(OpResult opResult) const;		bool wouldCreateWriteToNonWritableBuffer(OpOperand &opOperand,
		OpResult opResult) const;

/// Assume that result bufferizes in-place with one of the operation's		/// Assume that result bufferizes in-place with one of the operation's
/// operands. Return true if it is possible to find an inplace write W (resp.		/// operands. Return true if it is possible to find an inplace write W (resp.
/// a read R) among the uses of `aliasInfo[result]`, and a read R (resp. an		/// a read R) among the uses of `aliasInfo[result]`, and a read R (resp. an
/// inplace write W) among the uses of		/// inplace write W) among the uses of
/// `aliasInfo[getAliasingOpOperand(result)]`, such that W and R interfere.		/// `aliasInfo[getAliasingOpOperand(result)]`, such that W and R interfere.
/// Interference detection is needed to determine which cases may bufferize		/// Interference detection is needed to determine which cases may bufferize
/// inplace without interferences. Such cases comprise:		/// inplace without interferences. Such cases comprise:
///		///
/// ```		/// ```
/// %0 = op_to_bufferize(%1)		/// %0 = op_to_bufferize(%1)
/// read(%1)		/// read(%1)
///		///
/// %0 = op_to_bufferize(%1)		/// %0 = op_to_bufferize(%1)
/// write(%0)		/// write(%0)
/// read(%1)		/// read(%1)
///		///
/// %0 = op_to_bufferize(%1)		/// %0 = op_to_bufferize(%1)
/// write(%1)		/// write(%1)
/// read(%0)		/// read(%0)
/// ```		/// ```
bool		bool
wouldCreateReadAfterWriteInterference(OpResult result,		wouldCreateReadAfterWriteInterference(OpOperand &operand, OpResult result,
const DominanceInfo &domInfo) const;		const DominanceInfo &domInfo) const;

/// Return true if `v1` and `v2` bufferize to equivalent buffers.		/// Return true if `v1` and `v2` bufferize to equivalent buffers.
bool areEquivalentBufferizedValues(Value v1, Value v2) const {		bool areEquivalentBufferizedValues(Value v1, Value v2) const {
return equivalentInfo.getLeaderValue(v1) ==		return equivalentInfo.getLeaderValue(v1) ==
equivalentInfo.getLeaderValue(v2);		equivalentInfo.getLeaderValue(v2);
}		}

▲ Show 20 Lines • Show All 104 Lines • ▼ Show 20 Lines	private:
/// These are the conservative cases that can further decompose into		/// These are the conservative cases that can further decompose into
/// "equivalent" buffer relationships.		/// "equivalent" buffer relationships.
llvm::EquivalenceClasses<ValueWrapper> aliasInfo;		llvm::EquivalenceClasses<ValueWrapper> aliasInfo;

/// Auxiliary structure to store all the equivalent buffer classes.		/// Auxiliary structure to store all the equivalent buffer classes.
llvm::EquivalenceClasses<ValueWrapper> equivalentInfo;		llvm::EquivalenceClasses<ValueWrapper> equivalentInfo;
};		};

/// Analyze the `ops` to determine which OpResults are inplaceable:		/// Analyze the `ops` to determine which OpResults are inplaceable.
LogicalResult inPlaceAnalysis(SmallVector<Operation *> &ops,		LogicalResult inPlaceAnalysis(SmallVector<Operation *> &ops,
BufferizationAliasInfo &aliasInfo,		BufferizationAliasInfo &aliasInfo,
const DominanceInfo &domInfo);		const DominanceInfo &domInfo);

/// Bufferize one particular op.		/// Bufferize one particular op.
/// `bufferizedFunctionTypes` (resp. `globalCreator`) are expected to be		/// `bufferizedFunctionTypes` (resp. `globalCreator`) are expected to be
/// non-null if `op` is a CallOpInterface (resp. GlobalCreator).		/// non-null if `op` is a CallOpInterface (resp. GlobalCreator).
LogicalResult		LogicalResult
Show All 9 Lines

mlir/lib/Dialect/Linalg/Transforms/ComprehensiveBufferize.cpp

Show First 20 Lines • Show All 555 Lines • ▼ Show 20 Lines
/// bufferization aliasing behavior, which indicates that the op must allocate		/// bufferization aliasing behavior, which indicates that the op must allocate
/// all of its tensor results.		/// all of its tensor results.
/// TODO: in the future this may need to evolve towards a list of OpOperand*.		/// TODO: in the future this may need to evolve towards a list of OpOperand*.
static Optional<OpOperand *> getAliasingOpOperand(OpResult result) {		static Optional<OpOperand *> getAliasingOpOperand(OpResult result) {
if (!hasKnownBufferizationAliasingBehavior(result.getDefiningOp()))		if (!hasKnownBufferizationAliasingBehavior(result.getDefiningOp()))
return None;		return None;
return TypeSwitch<Operation *, OpOperand *>(result.getDefiningOp())		return TypeSwitch<Operation *, OpOperand *>(result.getDefiningOp())
.Case([&](tensor::CastOp op) { return &op->getOpOperand(0); })		.Case([&](tensor::CastOp op) { return &op->getOpOperand(0); })
.Case([&](ConstantOp op) { return nullptr; })		.Case([&](ConstantOp op) { return nullptr; })
		nicolasvasilacheUnsubmitted Done Reply Inline Actions This fix is independent, please split it in a separate revision. nicolasvasilache: This fix is independent, please split it in a separate revision.
.Case([&](ExtractSliceOp op) { return &op->getOpOperand(0); })		.Case([&](ExtractSliceOp op) { return &op->getOpOperand(0); })
// In the case of scf::ForOp, this currently assumes the iter_args / yield		// In the case of scf::ForOp, this currently assumes the iter_args / yield
// are 1-1. This may fail and is verified at the end.		// are 1-1. This may fail and is verified at the end.
// TODO: update this.		// TODO: update this.
.Case([&](scf::ForOp op) {		.Case([&](scf::ForOp op) {
return &op.getIterOpOperands()[result.getResultNumber()];		return &op.getIterOpOperands()[result.getResultNumber()];
})		})
.Case([&](InitTensorOp op) { return nullptr; })		.Case([&](InitTensorOp op) { return nullptr; })
▲ Show 20 Lines • Show All 111 Lines • ▼ Show 20 Lines	bufferizesToMemoryWrite(OpOperand &opOperand,
// If we have a matching OpResult, this is a write.		// If we have a matching OpResult, this is a write.
// Additionally allow to restrict to only inPlace write, if so specified.		// Additionally allow to restrict to only inPlace write, if so specified.
return inPlaceSpec == InPlaceSpec::None ||		return inPlaceSpec == InPlaceSpec::None ||
getInPlace(opResult) == inPlaceSpec;		getInPlace(opResult) == inPlaceSpec;
}		}

/// Returns the relationship between the operand and its corresponding		/// Returns the relationship between the operand and its corresponding
/// OpResult that it may alias with.		/// OpResult that it may alias with.
static BufferRelation bufferRelation(OpOperand &operand) {		static BufferRelation bufferRelation(OpOperand &operand) {
		nicolasvasilacheUnsubmitted Done Reply Inline Actions this NFC API change can be in its own CL, please do that and land it without review to reduce the amount of changes in this revision. nicolasvasilache: this NFC API change can be in its own CL, please do that and land it without review to reduce…
return TypeSwitch<Operation *, BufferRelation>(operand.getOwner())		return TypeSwitch<Operation *, BufferRelation>(operand.getOwner())
// ExtractSliceOp returns a subview of the original tensor.		// ExtractSliceOp returns a subview of the original tensor.
.Case([&](ExtractSliceOp op) { return BufferRelation::None; })		.Case([&](ExtractSliceOp op) { return BufferRelation::None; })
// All other ops: Buffers are equivalent.		// All other ops: Buffers are equivalent.
.Default([&](Operation *op) { return BufferRelation::Equivalent; });		.Default([&](Operation *op) { return BufferRelation::Equivalent; });
}		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
Show All 32 Lines
void BufferizationAliasInfo::insertNewBufferEquivalence(Value newValue,		void BufferizationAliasInfo::insertNewBufferEquivalence(Value newValue,
Value alias) {		Value alias) {
insertNewBufferAlias(newValue, alias);		insertNewBufferAlias(newValue, alias);
equivalentInfo.unionSets(newValue, alias);		equivalentInfo.unionSets(newValue, alias);
}		}

/// Return true if, under current bufferization decisions, the buffer of `value`		/// Return true if, under current bufferization decisions, the buffer of `value`
/// is not writable.		/// is not writable.
bool BufferizationAliasInfo::aliasesNonWritableBuffer(Value value) const {		bool BufferizationAliasInfo::aliasesNonWritableBuffer(Value value) const {
		nicolasvasilacheUnsubmitted Done Reply Inline Actions this NFC API change can be in its own CL, please do that and land it without review to reduce the amount of changes in this revision. nicolasvasilache: this NFC API change can be in its own CL, please do that and land it without review to reduce…
LDBG("----Start aliasesNonWritableBuffer\n");		LDBG("----Start aliasesNonWritableBuffer\n");
for (Value v : getAliases(value)) {		for (Value v : getAliases(value)) {
LDBG("-----------examine: " << printValueInfo(v) << '\n');		LDBG("-----------examine: " << printValueInfo(v) << '\n');
if (bufferizesToWritableMemory(v)) {		if (bufferizesToWritableMemory(v)) {
LDBG("-----------Value is known to be writable -> skip: "		LDBG("-----------Value is known to be writable -> skip: "
<< printValueInfo(v) << '\n');		<< printValueInfo(v) << '\n');
continue;		continue;
}		}
▲ Show 20 Lines • Show All 122 Lines • ▼ Show 20 Lines
/// such that W and R interfere.		/// such that W and R interfere.
/// Such a (W, R) pair is an interference to the inplace bufferization of		/// Such a (W, R) pair is an interference to the inplace bufferization of
/// opResult when:		/// opResult when:
/// 1. R is not known to properly dominate W (i.e. the effects of the write		/// 1. R is not known to properly dominate W (i.e. the effects of the write
/// may be visible from R).		/// may be visible from R).
/// 2. one cannot find an intermediate clobbering write `C` to W, such that		/// 2. one cannot find an intermediate clobbering write `C` to W, such that
/// C interleaved between W and R (i.e. W -> C -> R where -> denotes		/// C interleaved between W and R (i.e. W -> C -> R where -> denotes
/// dominance).		/// dominance).
bool BufferizationAliasInfo::wouldCreateReadAfterWriteInterference(		bool BufferizationAliasInfo::wouldCreateReadAfterWriteInterference(
OpResult result, const DominanceInfo &domInfo) const {		OpOperand &operand, OpResult result, const DominanceInfo &domInfo) const {
Optional<OpOperand *> maybeAliasingOperand = getAliasingOpOperand(result);		assert(getAliasingOpOperand(result) == &operand &&
if (!maybeAliasingOperand)		"operand and result do not match");
		nicolasvasilacheUnsubmitted Not Done Reply Inline Actions I don't understand why this API needs to change in this revision. Losing the connection between opOperand and opResult is problematic to me here and below. At the very least we should have strong documentation and loud assertion about the cases we allow. nicolasvasilache: I don't understand why this API needs to change in this revision. Losing the connection between…
		springermAuthorUnsubmitted Done Reply Inline Actions This was just for convenience, since we already have the OpOperand in the caller. We could add another assert here, expand the comment to say that they have to match, or just abandon this revision. Either one is fine with me. I just think that the `Optional<OpOperand *>` leads to unnecessarily complex (hard to parse/understand) code. springerm: This was just for convenience. Since we already have the OpOperand in the caller. We could add…
		nicolasvasilacheUnsubmitted Not Done Reply Inline Actions with the assert, this WFM, thanks! nicolasvasilache: with the assert, this WFM, thanks!
return false;

Operation *opToBufferize = result.getDefiningOp();		Operation *opToBufferize = result.getDefiningOp();
Value opResult = result;		Value opResult = result;
Value opOperand = (*maybeAliasingOperand)->get();		Value opOperand = operand.get();

LDBG("----Start wouldCreateReadAfterWriteInterference\n");		LDBG("----Start wouldCreateReadAfterWriteInterference\n");
LDBG("--------consider all aliases to root read: "		LDBG("--------consider all aliases to root read: "
<< printValueInfo(opOperand) << "\n");		<< printValueInfo(opOperand) << "\n");
LDBG("--------consider all aliases to root write: "		LDBG("--------consider all aliases to root write: "
<< printValueInfo(opResult) << "\n");		<< printValueInfo(opResult) << "\n");

/// Helper function to iterate on aliases of `root` and capture the reads.		/// Helper function to iterate on aliases of `root` and capture the reads.
Show All 35 Lines	bool BufferizationAliasInfo::wouldCreateReadAfterWriteInterference(
// read(%3)		// read(%3)
// ```		// ```
DenseSet<OpOperand *> usesRead, usesWrite;		DenseSet<OpOperand *> usesRead, usesWrite;
LDBG("--------\n");		LDBG("--------\n");
LDBG("--------Test reads(opOperand) vs writes(opResult)\n");		LDBG("--------Test reads(opOperand) vs writes(opResult)\n");
getAliasingReads(usesRead, opOperand);		getAliasingReads(usesRead, opOperand);
getAliasingInplaceWrites(usesWrite, opResult);		getAliasingInplaceWrites(usesWrite, opResult);
// Additionally, `result` is not yet bufferized and we need to check for		// Additionally, `result` is not yet bufferized and we need to check for
// interferences as if it were bufferized inplace: add `maybeAliasingOperand`		// interferences as if it were bufferized inplace: add `operand` if it is a
// if it is a write. This handles the case:		// write. This handles the case:
//		//
// ```		// ```
// %0 = op_to_bufferize_maybe_inplace(%1)		// %0 = op_to_bufferize_maybe_inplace(%1)
// %2 = some_alias(%1)		// %2 = some_alias(%1)
// read(%2)		// read(%2)
// ```		// ```
if (bufferizesToMemoryWrite(**maybeAliasingOperand))		if (bufferizesToMemoryWrite(operand))
usesWrite.insert(*maybeAliasingOperand);		usesWrite.insert(&operand);
if (wouldCreateReadAfterWriteInterference(opToBufferize, usesRead, usesWrite,		if (wouldCreateReadAfterWriteInterference(opToBufferize, usesRead, usesWrite,
domInfo))		domInfo))
return true;		return true;

// Check if we can find any interference between writes to		// Check if we can find any interference between writes to
// aliases[`opOperand`] and reads to aliases[`opResult`]. This handles the		// aliases[`opOperand`] and reads to aliases[`opResult`]. This handles the
// case:		// case:
//		//
Show All 9 Lines	bool BufferizationAliasInfo::wouldCreateReadAfterWriteInterference(
usesRead.clear();		usesRead.clear();
usesWrite.clear();		usesWrite.clear();
getAliasingReads(usesRead, opResult);		getAliasingReads(usesRead, opResult);
getAliasingInplaceWrites(usesWrite, opOperand);		getAliasingInplaceWrites(usesWrite, opOperand);
return wouldCreateReadAfterWriteInterference(opToBufferize, usesRead,		return wouldCreateReadAfterWriteInterference(opToBufferize, usesRead,
usesWrite, domInfo);		usesWrite, domInfo);
}		}

/// Return true if bufferizing `opResult` inplace would create a write to a		/// Return true if bufferizing `opOperand` inplace with `opResult` would create
/// non-writable buffer.		/// a write to a non-writable buffer.
bool BufferizationAliasInfo::wouldCreateWriteToNonWritableBuffer(		bool BufferizationAliasInfo::wouldCreateWriteToNonWritableBuffer(
OpResult opResult) const {		OpOperand &opOperand, OpResult opResult) const {
		nicolasvasilacheUnsubmitted Not Done Reply Inline Actions losing the connection between opOperand and opResult is problematic to me here. nicolasvasilache: losing the connection between opOperand and opResult is problematic to me here.
Optional<OpOperand *> maybeAliasingOperand = getAliasingOpOperand(opResult);		assert(getAliasingOpOperand(opResult) == &opOperand &&
if (!maybeAliasingOperand || !*maybeAliasingOperand)		"operand and result do not match");
return false;

// Certain buffers are not writeable:		// Certain buffers are not writeable:
// 1. A function bbArg that is not inplaceable or		// 1. A function bbArg that is not inplaceable or
		nicolasvasilacheUnsubmitted Done Reply Inline Actions Since we lost the connection between opOperand and opResult, opOperand may be readonly and it does not make sense to call aliasesNonWritableBuffer on it. nicolasvasilache: Since we lost the connection between opOperand and opResult, opOperand may be readonly and it…
		springermAuthorUnsubmitted Done Reply Inline Actions `aliasesNonWritableBuffer` can be called on any Value. Should not be a problem. The main change around this location has moved to D111379. While the new version may cover a few cases that may never appear in reality, I find it easier to understand. In particular, I was thinking for a while that the existing conflict detection code for non-writable buffers is missing a case: `%r = tensor.extract_slice %t`, where (1) %t aliases an in-place write and (2) %r aliases a non-writable buffer. This case is not covered by the existing code. The new one (D111379) does cover it. I now believe that it is not possible to construct such an example. However, this was not immediately obvious to me. So for the sake of simplicity/understandability, my suggestion would be to go with a version similar to D111379. springerm: `aliasesNonWritableBuffer` can be called on any Value. Should not be a problem. The main…
// 2. A constant op.		// 2. A constant op.
assert(!aliasesNonWritableBuffer(opResult) &&		assert(!aliasesNonWritableBuffer(opResult) &&
"expected that opResult does not alias non-writable buffer");		"expected that opResult does not alias non-writable buffer");
bool nonWritable = aliasesNonWritableBuffer((*maybeAliasingOperand)->get());		bool nonWritable = aliasesNonWritableBuffer(opOperand.get());
if (!nonWritable)		if (!nonWritable)
return false;		return false;

// This is a problem only if the buffer is written to via some alias.		// This is a problem only if the buffer is written to via some alias.
bool hasWrite = aliasesInPlaceWrite(opResult) ||		bool hasWrite = aliasesInPlaceWrite(opResult) ||
aliasesInPlaceWrite((*maybeAliasingOperand)->get()) ||		aliasesInPlaceWrite(opOperand.get()) ||
bufferizesToMemoryWrite(**maybeAliasingOperand);		bufferizesToMemoryWrite(opOperand);
if (!hasWrite)		if (!hasWrite)
return false;		return false;

LDBG("->the corresponding buffer is not writeable\n");		LDBG("->the corresponding buffer is not writeable\n");
return true;		return true;
}		}

/// Return true if the source of a `insertSliceOp` bufferizes to an		/// Return true if the source of a `insertSliceOp` bufferizes to an
▲ Show 20 Lines • Show All 1,246 Lines • ▼ Show 20 Lines	bufferizableInPlaceAnalysisImpl(OpOperand &operand, OpResult result,
int64_t resultNumber = result.getResultNumber();		int64_t resultNumber = result.getResultNumber();
(void)resultNumber;		(void)resultNumber;
LDBG('\n');		LDBG('\n');
LDBG("Inplace analysis for <- #" << resultNumber << " -> #"		LDBG("Inplace analysis for <- #" << resultNumber << " -> #"
<< operand.getOperandNumber() << " in "		<< operand.getOperandNumber() << " in "
<< printValueInfo(result) << '\n');		<< printValueInfo(result) << '\n');

bool foundInterference =		bool foundInterference =
aliasInfo.wouldCreateWriteToNonWritableBuffer(result) ||		aliasInfo.wouldCreateWriteToNonWritableBuffer(operand, result) ||
aliasInfo.wouldCreateReadAfterWriteInterference(result, domInfo);		aliasInfo.wouldCreateReadAfterWriteInterference(operand, result, domInfo);

if (foundInterference)		if (foundInterference)
aliasInfo.bufferizeOutOfPlace(result);		aliasInfo.bufferizeOutOfPlace(result);
else		else
aliasInfo.bufferizeInPlace(result, operand);		aliasInfo.bufferizeInPlace(result, operand);

LDBG("Done inplace analysis for result #" << resultNumber << '\n');		LDBG("Done inplace analysis for result #" << resultNumber << '\n');

return success();		return success();
}		}

///		///
/// Rationale for bufferizing `%1 = tensor.extract_slice %0[...]` inplace.		/// Rationale for bufferizing `%1 = tensor.extract_slice %0[...]` inplace.
nicolasvasilacheUnsubmitted Done Reply Inline Actions Please do not drop these comments as they are not trivial to infer. A lot of load-bearing semantic is now carried by BufferRelation::None which hides this discussion. We need to find a way to document this to avoid surprises in the future. nicolasvasilache: Please do not drop these comments as they are not trivial to infer. A lot of load-bearing…
springermAuthorUnsubmitted Done Reply Inline Actions Moved into the body of `mlir::linalg::inPlaceAnalysis`. springerm: Moved into the body of `mlir::linalg::inPlaceAnalysis`.
/// ===========================================================		/// ===========================================================
///		///
/// When bufferized out of place, an ExtractSlice lowers to alloc + copy. This		/// When bufferized out of place, an ExtractSlice lowers to alloc + copy. This
/// cannot change the flow of information for either the source or the		/// cannot change the flow of information for either the source or the
/// result buffers.		/// result buffers.
///		///
/// When bufferized inplace, an ExtractSliceOp does not by itself create any read		/// When bufferized inplace, an ExtractSliceOp does not by itself create any read
/// or write from memory. Instead, it has the effect of merging the alias sets		/// or write from memory. Instead, it has the effect of merging the alias sets
/// of the source and the result buffers.		/// of the source and the result buffers.
///		///
/// An analysis is required to ensure inplace bufferization would not result in		/// An analysis is required to ensure inplace bufferization would not result in
/// RaW dependence violations.		/// RaW dependence violations.
static LogicalResult		static LogicalResult
bufferizableInPlaceAnalysis(ExtractSliceOp extractSliceOp,		bufferizableInPlaceAnalysis(ExtractSliceOp extractSliceOp,
		nicolasvasilacheUnsubmitted Done Reply Inline Actions Let's call this one bufferizableInPlaceAnalysisImpl and add some assert that operand and result are related and cannot be random things. Atm we lose this information and it is unclear who should call what. Let's keep the ExtractSliceOp version and make it call the Impl. nicolasvasilache: Let's call this one bufferizableInPlaceAnalysisImpl and add some assert that operand and result…
BufferizationAliasInfo &aliasInfo,		BufferizationAliasInfo &aliasInfo,
const DominanceInfo &domInfo) {		const DominanceInfo &domInfo) {
return bufferizableInPlaceAnalysisImpl(extractSliceOp->getOpOperand(0),		return bufferizableInPlaceAnalysisImpl(extractSliceOp->getOpOperand(0),
extractSliceOp->getOpResult(0),		extractSliceOp->getOpResult(0),
aliasInfo, domInfo);		aliasInfo, domInfo);
}		}

/// Determine if `operand` can be bufferized in-place with one of the op's		/// Determine if `operand` can be bufferized in-place with one of the op's
/// results. If so, set InPlaceSpec::True on the result. Otherwise, set		/// results. If so, set InPlaceSpec::True on the result. Otherwise, set
/// InPlaceSpec::False on the result.		/// InPlaceSpec::False on the result.
static LogicalResult		static LogicalResult
bufferizableInPlaceAnalysis(OpOperand &operand,		bufferizableInPlaceAnalysis(OpOperand &operand,
BufferizationAliasInfo &aliasInfo,		BufferizationAliasInfo &aliasInfo,
const DominanceInfo &domInfo) {		const DominanceInfo &domInfo) {
OpResult result = getInplaceableOpResult(operand);		OpResult result = getInplaceableOpResult(operand);
		nicolasvasilacheUnsubmitted Done Reply Inline Actions This is fishy: there may be ops in the future that have an input which aliases only a part of the result. When bufferized, these don't have enough room to fit the result. Putting a blocker until this is discussed. nicolasvasilache: This is fishy: there may be ops in the future that have an input which aliases only a part of…
		springermAuthorUnsubmitted Done Reply Inline Actions Currently, the entire machinery assumes (conservatively) that two tensors alias either entirely or not at all. It's not just `getAliasingOpResult`, but also `wouldCreateReadAfterWriteInterference`. `This is fishy: there may be ops in the future that have an input which aliases only a part of the result. When bufferized, these don't have enough room to fit the result.` I'm trying to understand when there would not be enough room to fit the result. E.g., this would be an op where the result tensor is larger than the argument tensor? This would require some redesign. There has to be an allocation somewhere. We currently avoid these cases by having explicit "output" tensors (like in linalg.generic). Then we would always have a suitable tensor (with the right size) to alias with. If we have to support such ops that we cannot change, we have to find a different solution. However, my thinking is: If `getAliasingOpResult` returns an OpResult and `getInplaceableOpResult` returns `null` (that's presumably the case you are concerned about; and that's also the case for ExtractSliceOp), the OpOperand is guaranteed to not bufferize to a memory write. "Proof" by contradiction: Let's assume that: (1) `getAliasingOpResult` returns an OpResult, (2) `getInplaceableOpResult` returns `null`, and (3) the OpOperand bufferizes to a memory write. Since `getInplaceableOpResult` is `null` and the operation is writing, it must create a new allocation and copy, i.e., bufferize out-of-place. But in that case, it cannot have an aliasing OpResult. Does this make sense? springerm: Currently, the entire machinery assumes (conservatively) that two tensors alias either entirely…
		springermAuthorUnsubmitted Done Reply Inline Actions As discussed, special handling of ExtractSliceOp for the moment. springerm: As discussed, special handling of ExtractSliceOp for the moment.
if (!result)		if (!result)
return success();		return success();
return bufferizableInPlaceAnalysisImpl(operand, result, aliasInfo, domInfo);		return bufferizableInPlaceAnalysisImpl(operand, result, aliasInfo, domInfo);
}		}

/// Analyze the `ops` to determine which OpResults are inplaceable:		/// Analyze the `ops` to determine which OpResults are inplaceable. Walk ops in
/// 1. First, analyze InsertSliceOp greedily: we almost never want to		/// reverse and bufferize ops greedily. This is a good starter heuristic.
/// bufferize the tensor "inserted into" to become out-of-place.
/// 2. Walk the other ops in reverse. This is a good starter heuristic.
/// ExtractSliceOps are interleaved with other ops in traversal order.		/// ExtractSliceOps are interleaved with other ops in traversal order.
///
LogicalResult mlir::linalg::inPlaceAnalysis(SmallVector<Operation *> &ops,		LogicalResult mlir::linalg::inPlaceAnalysis(SmallVector<Operation *> &ops,
BufferizationAliasInfo &aliasInfo,		BufferizationAliasInfo &aliasInfo,
const DominanceInfo &domInfo) {		const DominanceInfo &domInfo) {
// Walk ops in reverse for better interference analysis.		// Walk ops in reverse for better interference analysis.
for (Operation *op : reverse(ops)) {		for (Operation *op : reverse(ops)) {
for (OpOperand &opOperand : op->getOpOperands())		for (OpOperand &opOperand : op->getOpOperands())
if (failed(bufferizableInPlaceAnalysis(opOperand, aliasInfo, domInfo)))		if (failed(bufferizableInPlaceAnalysis(opOperand, aliasInfo, domInfo)))
return failure();		return failure();

// Special logic to analyze ExtractSliceOp.		// Special logic to analyze ExtractSliceOp.
// Note that ExtractSliceOp analysis needs to be interleaved with other ops		// Note that ExtractSliceOp analysis needs to be interleaved with other ops
// to properly capture aliases.		// to properly capture aliases.
// Walk ExtractSliceOps in reverse for better clobbering analysis behavior:		// Walk ExtractSliceOps in reverse for better clobbering analysis behavior:
// it is easier to detect clobbers of smaller slices before larger ones.		// it is easier to detect clobbers of smaller slices before larger ones.
if (auto extractSliceOp = dyn_cast<ExtractSliceOp>(op)) {		if (auto extractSliceOp = dyn_cast<ExtractSliceOp>(op))
if (failed(		if (failed(
bufferizableInPlaceAnalysis(extractSliceOp, aliasInfo, domInfo)))		bufferizableInPlaceAnalysis(extractSliceOp, aliasInfo, domInfo)))
return failure();		return failure();
continue;
}
}		}

return success();		return success();
}		}

/// Analyze the `funcOp` body to determine which OpResults are inplaceable.		/// Analyze the `funcOp` body to determine which OpResults are inplaceable.
static LogicalResult		static LogicalResult
inPlaceAnalysisFuncOpBody(FuncOp funcOp, BufferizationAliasInfo &aliasInfo,		inPlaceAnalysisFuncOpBody(FuncOp funcOp, BufferizationAliasInfo &aliasInfo,
const DominanceInfo &domInfo) {		const DominanceInfo &domInfo) {
LLVM_DEBUG(llvm::dbgs() << "\n\n");		LLVM_DEBUG(llvm::dbgs() << "\n\n");
LDBG("Begin InPlaceAnalysisFuncOpInternals:\n" << funcOp << '\n');		LDBG("Begin InPlaceAnalysisFuncOpInternals:\n" << funcOp << '\n');
assert(funcOp && funcOp->getNumRegions() > 0 && !funcOp.body().empty() &&		assert(funcOp && funcOp->getNumRegions() > 0 && !funcOp.body().empty() &&
"expected a funcOp definition with a body");		"expected a funcOp definition with a body");

		nicolasvasilacheUnsubmitted Done Reply Inline Actions Let's not jump the step here, call a `bufferizableInPlaceAnalysis(ExtractSliceOp` which can in turn call the lower level `bufferizableInPlaceAnalysisImpl`. nicolasvasilache: Let's not jump the step here, call a `bufferizableInPlaceAnalysis(ExtractSliceOp` which can in…
// Collect ops so we can build our own reverse traversal.		// Collect ops so we can build our own reverse traversal.
SmallVector<Operation *> ops;		SmallVector<Operation *> ops;
funcOp.walk([&](Operation *op) {		funcOp.walk([&](Operation *op) {
// No tensors => no buffers.		// No tensors => no buffers.
if (none_of(op->getOperandTypes(), isaTensor) &&		if (none_of(op->getOperandTypes(), isaTensor) &&
none_of(op->getResultTypes(), isaTensor))		none_of(op->getResultTypes(), isaTensor))
return;		return;
ops.push_back(op);		ops.push_back(op);
▲ Show 20 Lines • Show All 549 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][linalg][bufferize][NFC] Conflict detection funcs take OpOperand and OpResult
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 379228

mlir/include/mlir/Dialect/Linalg/Transforms/ComprehensiveBufferize.h

mlir/lib/Dialect/Linalg/Transforms/ComprehensiveBufferize.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][linalg][bufferize][NFC] Conflict detection funcs take OpOperand and OpResultClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 379228

mlir/include/mlir/Dialect/Linalg/Transforms/ComprehensiveBufferize.h

mlir/lib/Dialect/Linalg/Transforms/ComprehensiveBufferize.cpp

[mlir][linalg][bufferize][NFC] Conflict detection funcs take OpOperand and OpResult
ClosedPublic