Diff 277645

llvm/include/llvm/CodeGen/GlobalISel/CombinerHelper.h

Show First 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	public:
void applyCombineExtendingLoads(MachineInstr &MI, PreferredTuple &MatchInfo);		void applyCombineExtendingLoads(MachineInstr &MI, PreferredTuple &MatchInfo);

/// Combine \p MI into a pre-indexed or post-indexed load/store operation if		/// Combine \p MI into a pre-indexed or post-indexed load/store operation if
/// legal and the surrounding code makes it useful.		/// legal and the surrounding code makes it useful.
bool tryCombineIndexedLoadStore(MachineInstr &MI);		bool tryCombineIndexedLoadStore(MachineInstr &MI);
bool matchCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo);		bool matchCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo);
void applyCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo);		void applyCombineIndexedLoadStore(MachineInstr &MI, IndexedLoadStoreMatchInfo &MatchInfo);

		/// Match a G_SEXT_INREG \p MI whose source register already has enough known
		/// sign bits (as reported by known-bits analysis) for the extension to be
		/// redundant.
		bool matchSextAlreadyExtended(MachineInstr &MI);
		/// Replace the G_SEXT_INREG \p MI with a COPY of its source operand and erase
		/// \p MI. Always returns true.
		bool applySextAlreadyExtended(MachineInstr &MI);

bool matchElideBrByInvertingCond(MachineInstr &MI);		bool matchElideBrByInvertingCond(MachineInstr &MI);
void applyElideBrByInvertingCond(MachineInstr &MI);		void applyElideBrByInvertingCond(MachineInstr &MI);
bool tryElideBrByInvertingCond(MachineInstr &MI);		bool tryElideBrByInvertingCond(MachineInstr &MI);

/// If \p MI is G_CONCAT_VECTORS, try to combine it.		/// If \p MI is G_CONCAT_VECTORS, try to combine it.
/// Returns true if MI changed.		/// Returns true if MI changed.
/// Right now, we support:		/// Right now, we support:
/// - concat_vector(undef, undef) => undef		/// - concat_vector(undef, undef) => undef
▲ Show 20 Lines • Show All 166 Lines • Show Last 20 Lines

llvm/include/llvm/Target/GlobalISel/Combine.td

	Show First 20 Lines • Show All 119 Lines • ▼ Show 20 Lines

	def extending_loads : GICombineRule<			def extending_loads : GICombineRule<
	(defs root:$root, extending_load_matchdata:$matchinfo),			(defs root:$root, extending_load_matchdata:$matchinfo),
	(match (wip_match_opcode G_LOAD, G_SEXTLOAD, G_ZEXTLOAD):$root,			(match (wip_match_opcode G_LOAD, G_SEXTLOAD, G_ZEXTLOAD):$root,
	[{ return Helper.matchCombineExtendingLoads(*${root}, ${matchinfo}); }]),			[{ return Helper.matchCombineExtendingLoads(*${root}, ${matchinfo}); }]),
	(apply [{ Helper.applyCombineExtendingLoads(*${root}, ${matchinfo}); }])>;			(apply [{ Helper.applyCombineExtendingLoads(*${root}, ${matchinfo}); }])>;
	def combines_for_extload: GICombineGroup<[extending_loads]>;			def combines_for_extload: GICombineGroup<[extending_loads]>;

				// Fold away a G_SEXT_INREG that Helper.matchSextAlreadyExtended reports as
				// redundant; the rewrite itself is done by Helper.applySextAlreadyExtended.
				def sext_already_extended : GICombineRule<
				(defs root:$d),
				(match (wip_match_opcode G_SEXT_INREG):$d,
				[{ return Helper.matchSextAlreadyExtended(*${d}); }]),
				(apply [{ Helper.applySextAlreadyExtended(*${d}); }])>;

	def combine_indexed_load_store : GICombineRule<			def combine_indexed_load_store : GICombineRule<
	(defs root:$root, indexed_load_store_matchdata:$matchinfo),			(defs root:$root, indexed_load_store_matchdata:$matchinfo),
	(match (wip_match_opcode G_LOAD, G_SEXTLOAD, G_ZEXTLOAD, G_STORE):$root,			(match (wip_match_opcode G_LOAD, G_SEXTLOAD, G_ZEXTLOAD, G_STORE):$root,
	[{ return Helper.matchCombineIndexedLoadStore(*${root}, ${matchinfo}); }]),			[{ return Helper.matchCombineIndexedLoadStore(*${root}, ${matchinfo}); }]),
	(apply [{ Helper.applyCombineIndexedLoadStore(*${root}, ${matchinfo}); }])>;			(apply [{ Helper.applyCombineIndexedLoadStore(*${root}, ${matchinfo}); }])>;

	// FIXME: Is there a reason this wasn't in tryCombine? I've left it out of			// FIXME: Is there a reason this wasn't in tryCombine? I've left it out of
	// all_combines because it wasn't there.			// all_combines because it wasn't there.
	▲ Show 20 Lines • Show All 134 Lines • Show Last 20 Lines

llvm/lib/CodeGen/GlobalISel/CombinerHelper.cpp

Show First 20 Lines • Show All 570 Lines • ▼ Show 20 Lines	bool CombinerHelper::dominates(const MachineInstr &DefMI,
if (MDT)		if (MDT)
return MDT->dominates(&DefMI, &UseMI);		return MDT->dominates(&DefMI, &UseMI);
else if (DefMI.getParent() != UseMI.getParent())		else if (DefMI.getParent() != UseMI.getParent())
return false;		return false;

return isPredecessor(DefMI, UseMI);		return isPredecessor(DefMI, UseMI);
}		}

		/// Return true if the G_SEXT_INREG \p MI is redundant because its source
		/// register is already sign-extended from the requested bit position.
		///
		/// G_SEXT_INREG %src, Imm on a Size-bit scalar produces a value whose top
		/// (Size - Imm + 1) bits are all copies of bit (Imm - 1). The instruction is
		/// therefore a no-op only when the source already has at least that many
		/// sign bits; a source with exactly (Size - Imm) sign bits may still differ
		/// from its upper bits at bit (Imm - 1).
		bool CombinerHelper::matchSextAlreadyExtended(MachineInstr &MI) {
		assert(MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
		Register SrcReg = MI.getOperand(1).getReg();
		unsigned SrcSignBits = KB->computeNumSignBits(SrcReg);
		// Number of sign bits the result of the G_SEXT_INREG is guaranteed to have;
		// the "+ 1" accounts for bit (Imm - 1) itself, which becomes the sign bit.
		unsigned NumSextBits =
		MRI.getType(MI.getOperand(0).getReg()).getScalarSizeInBits() -
		arsenmUnsubmitted Not Done Reply Inline Actions getScalarSizeInBits arsenm: getScalarSizeInBits
		MI.getOperand(2).getImm() + 1;
		return SrcSignBits >= NumSextBits;
		arsenmUnsubmitted Not Done Reply Inline Actions This should be >=? arsenm: This should be >=?
		}

		arsenm (Not Done): This is just a special case of checking computeNumSignBits? Do we recognize the number of sign bits in a sextload yet?
		aemerson (author, Done): We don't, but using computeNumSignBits doesn't tell us how to find the original def in the chain that has redundantly been sign extended. E.g. in this case we won't know how to look through the truncate.
		/// Rewrite the redundant G_SEXT_INREG \p MI as a plain COPY from its source
		/// operand to its destination register, then delete \p MI.
		/// Always returns true.
		bool CombinerHelper::applySextAlreadyExtended(MachineInstr &MI) {
		assert(MI.getOpcode() == TargetOpcode::G_SEXT_INREG);
		const Register DstReg = MI.getOperand(0).getReg();
		const Register SrcReg = MI.getOperand(1).getReg();
		// The builder is constructed from MI, so the COPY has to be emitted before
		// MI is erased below.
		MachineIRBuilder CopyBuilder(MI);
		CopyBuilder.buildCopy(DstReg, SrcReg);
		arsenmUnsubmitted Not Done Reply Inline Actions I don't think introducing a new AnyExt would be right? arsenm: I don't think introducing a new AnyExt would be right?
		MI.eraseFromParent();
		return true;
		}

bool CombinerHelper::findPostIndexCandidate(MachineInstr &MI, Register &Addr,		bool CombinerHelper::findPostIndexCandidate(MachineInstr &MI, Register &Addr,
Register &Base, Register &Offset) {		Register &Base, Register &Offset) {
auto &MF = *MI.getParent()->getParent();		auto &MF = *MI.getParent()->getParent();
const auto &TLI = *MF.getSubtarget().getTargetLowering();		const auto &TLI = *MF.getSubtarget().getTargetLowering();

#ifndef NDEBUG		#ifndef NDEBUG
unsigned Opcode = MI.getOpcode();		unsigned Opcode = MI.getOpcode();
assert(Opcode == TargetOpcode::G_LOAD \|\| Opcode == TargetOpcode::G_SEXTLOAD \|\|		assert(Opcode == TargetOpcode::G_LOAD \|\| Opcode == TargetOpcode::G_SEXTLOAD \|\|
▲ Show 20 Lines • Show All 1,134 Lines • Show Last 20 Lines

llvm/lib/CodeGen/GlobalISel/GISelKnownBits.cpp

//===- lib/CodeGen/GlobalISel/GISelKnownBits.cpp --------------- C++ -===//		//===- lib/CodeGen/GlobalISel/GISelKnownBits.cpp --------------- C++ -===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
//		//
/// Provides analysis for querying information about KnownBits during GISel		/// Provides analysis for querying information about KnownBits during GISel
/// passes.		/// passes.
//		//
//===------------------		//===------------------
#include "llvm/CodeGen/GlobalISel/GISelKnownBits.h"		#include "llvm/CodeGen/GlobalISel/GISelKnownBits.h"
		#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/Analysis/ValueTracking.h"		#include "llvm/Analysis/ValueTracking.h"
#include "llvm/CodeGen/GlobalISel/Utils.h"		#include "llvm/CodeGen/GlobalISel/Utils.h"
#include "llvm/CodeGen/MachineFrameInfo.h"		#include "llvm/CodeGen/MachineFrameInfo.h"
#include "llvm/CodeGen/MachineRegisterInfo.h"		#include "llvm/CodeGen/MachineRegisterInfo.h"
#include "llvm/CodeGen/TargetLowering.h"		#include "llvm/CodeGen/TargetLowering.h"
#include "llvm/CodeGen/TargetOpcodes.h"		#include "llvm/CodeGen/TargetOpcodes.h"

#define DEBUG_TYPE "gisel-known-bits"		#define DEBUG_TYPE "gisel-known-bits"
▲ Show 20 Lines • Show All 414 Lines • ▼ Show 20 Lines	case TargetOpcode::COPY: {
return 1;		return 1;
}		}
case TargetOpcode::G_SEXT: {		case TargetOpcode::G_SEXT: {
Register Src = MI.getOperand(1).getReg();		Register Src = MI.getOperand(1).getReg();
LLT SrcTy = MRI.getType(Src);		LLT SrcTy = MRI.getType(Src);
unsigned Tmp = DstTy.getScalarSizeInBits() - SrcTy.getScalarSizeInBits();		unsigned Tmp = DstTy.getScalarSizeInBits() - SrcTy.getScalarSizeInBits();
return computeNumSignBits(Src, DemandedElts, Depth + 1) + Tmp;		return computeNumSignBits(Src, DemandedElts, Depth + 1) + Tmp;
}		}
		case TargetOpcode::G_SEXTLOAD: {
		LLT Ty = MRI.getType(MI.getOperand(0).getReg());
		arsenmUnsubmitted Not Done Reply Inline Actions I think this needs to be careful about a vector sextload arsenm: I think this needs to be careful about a vector sextload
		// TODO: add vector support
		if (Ty.isVector())
		arsenmUnsubmitted Not Done Reply Inline Actions Should add TODO to handle vectors arsenm: Should add TODO to handle vectors
		break;
		// A sign-extending load replicates the top bit of the loaded value into
		// every higher bit of the result, so the (TyBits - MemBits) extension bits
		// plus the loaded value's own sign bit are all equal, e.g. a 16-bit load
		// into s32 has 17 sign bits, not 16.
		if (MI.hasOneMemOperand())
		return Ty.getSizeInBits() - (*MI.memoperands_begin())->getSizeInBits() + 1;
		break;
		}
case TargetOpcode::G_TRUNC: {		case TargetOpcode::G_TRUNC: {
Register Src = MI.getOperand(1).getReg();		Register Src = MI.getOperand(1).getReg();
LLT SrcTy = MRI.getType(Src);		LLT SrcTy = MRI.getType(Src);

// Check if the sign bits of source go down as far as the truncated value.		// Check if the sign bits of source go down as far as the truncated value.
unsigned DstTyBits = DstTy.getScalarSizeInBits();		unsigned DstTyBits = DstTy.getScalarSizeInBits();
unsigned NumSrcBits = SrcTy.getScalarSizeInBits();		unsigned NumSrcBits = SrcTy.getScalarSizeInBits();
unsigned NumSrcSignBits = computeNumSignBits(Src, DemandedElts, Depth + 1);		unsigned NumSrcSignBits = computeNumSignBits(Src, DemandedElts, Depth + 1);
▲ Show 20 Lines • Show All 50 Lines • Show Last 20 Lines

llvm/lib/Target/AArch64/AArch64Combine.td

	Show First 20 Lines • Show All 73 Lines • ▼ Show 20 Lines

	// Combines which replace a G_SHUFFLE_VECTOR with a target-specific pseudo			// Combines which replace a G_SHUFFLE_VECTOR with a target-specific pseudo
	// instruction.			// instruction.
	def shuffle_vector_pseudos : GICombineGroup<[dup, rev, ext, zip, uzp, trn]>;			def shuffle_vector_pseudos : GICombineGroup<[dup, rev, ext, zip, uzp, trn]>;

	def AArch64PostLegalizerCombinerHelper			def AArch64PostLegalizerCombinerHelper
	: GICombinerHelper<"AArch64GenPostLegalizerCombinerHelper",			: GICombinerHelper<"AArch64GenPostLegalizerCombinerHelper",
	[erase_undef_store, combines_for_extload,			[erase_undef_store, combines_for_extload,
	shuffle_vector_pseudos]> {			sext_already_extended, shuffle_vector_pseudos]> {
	let DisableRuleOption = "aarch64postlegalizercombiner-disable-rule";			let DisableRuleOption = "aarch64postlegalizercombiner-disable-rule";
	}			}

llvm/test/CodeGen/AArch64/GlobalISel/combine-sext-trunc-sextload.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple aarch64 -run-pass=aarch64-postlegalizer-combiner -verify-machineinstrs %s -o - \| FileCheck %s
				---
				name: test_combine_sext_trunc_of_sextload
				legalized: true
				tracksRegLiveness: true
				body: \|
				bb.0.entry:
				liveins: $x0
				; CHECK-LABEL: name: test_combine_sext_trunc_of_sextload
				; CHECK: liveins: $x0
				; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0
				; CHECK: [[SEXTLOAD:%[0-9]+]]:_(s64) = G_SEXTLOAD [[COPY]](p0) :: (load 2)
				; CHECK: [[TRUNC:%[0-9]+]]:_(s32) = G_TRUNC [[SEXTLOAD]](s64)
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[TRUNC]](s32)
				; CHECK: $w0 = COPY [[COPY1]](s32)
				%0:_(p0) = COPY $x0
				%1:_(s64) = G_SEXTLOAD %0:_(p0) :: (load 2)
				%2:_(s32) = G_TRUNC %1:_(s64)
				%3:_(s32) = G_SEXT_INREG %2:_(s32), 16
				$w0 = COPY %3(s32)
				...
				---
				name: test_combine_sext_of_sextload
				legalized: true
				tracksRegLiveness: true
				body: \|
				bb.0.entry:
				liveins: $x0
				; CHECK-LABEL: name: test_combine_sext_of_sextload
				; CHECK: liveins: $x0
				; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0
				; CHECK: [[SEXTLOAD:%[0-9]+]]:_(s32) = G_SEXTLOAD [[COPY]](p0) :: (load 2)
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[SEXTLOAD]](s32)
				; CHECK: [[COPY2:%[0-9]+]]:_(s32) = COPY [[COPY1]](s32)
				; CHECK: $w0 = COPY [[COPY2]](s32)
				%0:_(p0) = COPY $x0
				%1:_(s32) = G_SEXTLOAD %0:_(p0) :: (load 2)
				%2:_(s32) = COPY %1:_(s32)
				%3:_(s32) = G_SEXT_INREG %2:_(s32), 16
				$w0 = COPY %3(s32)
				...
				---
				name: test_combine_sext_of_sextload_not_matching
				legalized: true
				tracksRegLiveness: true
				body: \|
				bb.0.entry:
				liveins: $x0
				; Here we're trying to extend from a larger width than was extended in the load.
				; CHECK-LABEL: name: test_combine_sext_of_sextload_not_matching
				; CHECK: liveins: $x0
				; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0
				; CHECK: [[SEXTLOAD:%[0-9]+]]:_(s32) = G_SEXTLOAD [[COPY]](p0) :: (load 2)
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[SEXTLOAD]](s32)
				; CHECK: $w0 = COPY [[COPY1]](s32)
				%0:_(p0) = COPY $x0
				%1:_(s32) = G_SEXTLOAD %0:_(p0) :: (load 2)
				%2:_(s32) = G_SEXT_INREG %1:_(s32), 24
				$w0 = COPY %2(s32)
				...
				---
				name: test_combine_sext_of_sextload_not_enough_src_signbits
				legalized: true
				tracksRegLiveness: true
				body: \|
				bb.0.entry:
				liveins: $x0
				; Here we're trying to extend from a smaller width than was extended in the load.
				; Don't perform the combine.
				; CHECK-LABEL: name: test_combine_sext_of_sextload_not_enough_src_signbits
				; CHECK: liveins: $x0
				; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0
				; CHECK: [[SEXTLOAD:%[0-9]+]]:_(s32) = G_SEXTLOAD [[COPY]](p0) :: (load 2)
				; CHECK: [[SEXT_INREG:%[0-9]+]]:_(s32) = G_SEXT_INREG [[SEXTLOAD]], 8
				; CHECK: $w0 = COPY [[SEXT_INREG]](s32)
				%0:_(p0) = COPY $x0
				%1:_(s32) = G_SEXTLOAD %0:_(p0) :: (load 2)
				%2:_(s32) = G_SEXT_INREG %1:_(s32), 8
				$w0 = COPY %2(s32)
				...

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64][GlobalISel] Add post-legalize combine for sext(trunc(sextload)) -> trunc/copy
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 277645

llvm/include/llvm/CodeGen/GlobalISel/CombinerHelper.h

llvm/include/llvm/Target/GlobalISel/Combine.td

llvm/lib/CodeGen/GlobalISel/CombinerHelper.cpp

llvm/lib/CodeGen/GlobalISel/GISelKnownBits.cpp

llvm/lib/Target/AArch64/AArch64Combine.td

llvm/test/CodeGen/AArch64/GlobalISel/combine-sext-trunc-sextload.mir

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64][GlobalISel] Add post-legalize combine for sext(trunc(sextload)) -> trunc/copy
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 277645

llvm/include/llvm/CodeGen/GlobalISel/CombinerHelper.h

llvm/include/llvm/Target/GlobalISel/Combine.td

llvm/lib/CodeGen/GlobalISel/CombinerHelper.cpp

llvm/lib/CodeGen/GlobalISel/GISelKnownBits.cpp

llvm/lib/Target/AArch64/AArch64Combine.td

llvm/test/CodeGen/AArch64/GlobalISel/combine-sext-trunc-sextload.mir

[AArch64][GlobalISel] Add post-legalize combine for sext(trunc(sextload)) -> trunc/copy
ClosedPublic